Skip to content

Commit

Permalink
fix: intxweight -> wxa16, b_ready_cache_len -> infer_state.b_ready_cache_len (#371)

Browse files Browse the repository at this point in the history

Co-authored-by: wanzihao <[email protected]>
  • Loading branch information
WANDY666 and wanzihao authored Mar 21, 2024
1 parent c3dc640 commit 755c4fd
Showing 1 changed file with 2 additions and 2 deletions.
4 changes: 2 additions & 2 deletions lightllm/common/basemodel/basemodel.py
Original file line number Diff line number Diff line change
Expand Up @@ -38,7 +38,7 @@ def __init__(self, kvargs):
self.weight_dir_ = kvargs["weight_dir"]
self.max_total_token_num = kvargs["max_total_token_num"]
self.load_way = kvargs.get("load_way", "HF")
- self.mode = kvargs.get("mode", [])
+ self.mode = [m.replace('int4weight', 'w4a16').replace('int8weight', 'w8a16') for m in kvargs.get("mode", [])]
self.weight_dict = kvargs.get("weight_dict", None)
self.finetune_config = kvargs.get("finetune_config", None)
self.max_req_num = kvargs.get("max_req_num", 1000)
Expand Down Expand Up @@ -231,7 +231,7 @@ def _prefill(
self.req_manager.req_to_token_indexs,
b_req_idx,
b_seq_len,
- b_ready_cache_len,
+ infer_state.b_ready_cache_len,
max_len_in_batch,
infer_state.mem_index,
)
Expand Down

0 comments on commit 755c4fd

Please sign in to comment.