mirror of
https://gitee.com/mindspore/mindformers.git
synced 2025-12-06 11:29:59 +08:00
!7790 【master】【bug-fix】解决q_lora_rank为None时,跑推理任务权重加载不上的问题
Merge pull request !7790 from zhouxq/weight_q_lora_rank_master
This commit is contained in:
@@ -195,7 +195,7 @@ class InferModelMixin(ModelMixin):
|
||||
def _safetensors_weights_iterator(self, weights_files: List[str]) -> Generator[Tuple[str, Any], None, None]:
|
||||
"""Iterate over the weights in the model safetensor files."""
|
||||
rank_id = get_tensor_model_parallel_rank()
|
||||
is_main_rank = (rank_id == 0)
|
||||
is_main_rank = rank_id == 0
|
||||
for st_file in tqdm(
|
||||
weights_files,
|
||||
desc=f"[Rank {rank_id}] Loading safetensors checkpoint shards",
|
||||
@@ -236,7 +236,9 @@ class InferModelMixin(ModelMixin):
|
||||
"""
|
||||
mapping_rules = {
|
||||
'.linear_q_down_proj.': ('.linear_qkv_down_proj.', '.linear_q_down_proj.', 'q_down'),
|
||||
'.linear_kv_down_proj.': ('.linear_qkv_down_proj.', '.linear_kv_down_proj.', 'kv_down'),
|
||||
'.linear_kv_down_proj.': ('.linear_qkv_down_proj.', '.linear_kv_down_proj.', 'kv_down')
|
||||
if getattr(self.config, 'q_lora_rank', None) is not None else
|
||||
('.linear_kv_down_proj.', '.linear_kv_down_proj.', 'kv_down'),
|
||||
'.linear_q_up_proj.': ('.linear_q_up_proj.', '.linear_q_up_proj.', 'q_up'),
|
||||
'.linear_kv_up_proj.': ('.linear_kv_up_proj.', '.linear_kv_up_proj.', 'kv_up'),
|
||||
'.linear_q.': ('.linear_qkv.', '.linear_q.', 'q'),
|
||||
|
||||
Reference in New Issue
Block a user