fix minicpm-v2.5 lora_target_modules #1455

Merged (1 commit) on Jul 20, 2024
4 changes: 2 additions & 2 deletions docs/source/Multi-Modal/minicpm-v-2.5最佳实践.md
@@ -160,8 +160,8 @@ road:

(By default, LoRA fine-tuning is applied only to the qkv projections of the LLM part. If you want to fine-tune all linear layers, including those in the vision model, you can specify `--lora_target_modules ALL`. Full-parameter fine-tuning is also supported.)
```shell
-# Experimental environment: A100
-# 32GB GPU memory
+# Experimental environment: 3090
+# 20GB GPU memory
CUDA_VISIBLE_DEVICES=0 swift sft \
--model_type minicpm-v-v2_5-chat \
--dataset coco-en-2-mini \
5 changes: 4 additions & 1 deletion swift/llm/utils/argument.py
@@ -742,7 +742,10 @@ def _prepare_target_modules(self, target_modules) -> List[str]:
            target_modules.append('DEFAULT')
        if 'DEFAULT' in target_modules:
            target_modules.remove('DEFAULT')
-           target_modules += get_default_lora_target_modules(self.model_type)
+           default_lora_tm = get_default_lora_target_modules(self.model_type)
+           if isinstance(default_lora_tm, str):
+               return default_lora_tm
+           target_modules += default_lora_tm
        if 'EMBEDDING' in target_modules:
            target_modules.remove('EMBEDDING')
            self.lora_use_embedding = True
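For context, here is a minimal sketch (not swift's actual code) of why the early return matters: PEFT interprets a str-valued `target_modules` as a regex matched with `re.fullmatch`, while a list is matched by module-name suffix, so a regex default such as `LoRATM.minicpm_llama` has to be handed back whole rather than merged into a list.

```python
import re
from typing import List, Union

# Illustrative re-creation of PEFT's matching rule (roughly what
# peft.tuners.tuners_utils.check_target_module_exists does); the helper
# name is an assumption for this sketch, not swift's or PEFT's own API.
def module_matches(target_modules: Union[str, List[str]], key: str) -> bool:
    if isinstance(target_modules, str):
        # A str is treated as a regex and applied with re.fullmatch.
        return re.fullmatch(target_modules, key) is not None
    # A list is matched against module-name suffixes.
    return any(key == m or key.endswith('.' + m) for m in target_modules)

regex = r'.*model\.layers\.(?:[0-9]|[12][0-9]|3[01])\.(?:self_attn\.(?:q_proj|k_proj|v_proj))'

# Returned whole as a str, the regex selects the intended attention layers:
assert module_matches(regex, 'llm.model.layers.5.self_attn.q_proj')
# Appended into a list it would degrade to a never-matching suffix,
# which is why _prepare_target_modules now returns the str early:
assert not module_matches([regex], 'llm.model.layers.5.self_attn.q_proj')
```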
3 changes: 2 additions & 1 deletion swift/llm/utils/model.py
@@ -515,6 +515,7 @@ class LoRATM(NamedTuple):
        'kv_b_proj',
        'o_proj',
    ]
+    minicpm_llama = r'.*model\.layers\.(?:[0-9]|[12][0-9]|3[01])\.(?:self_attn\.(?:q_proj|k_proj|v_proj))'
    # compat
    llama2 = llama
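As a quick sanity check (illustrative, not part of the PR), the new pattern selects only the q/k/v projections of LLM layers 0-31; the module names below assume the MiniCPM-Llama3-V-2_5 layout, where the language model sits under `llm.model.layers` and the vision tower under `vpm`:

```python
import re

pattern = r'.*model\.layers\.(?:[0-9]|[12][0-9]|3[01])\.(?:self_attn\.(?:q_proj|k_proj|v_proj))'

# q/k/v projections of LLM layers 0-31 match in full:
assert re.fullmatch(pattern, 'llm.model.layers.0.self_attn.q_proj')
assert re.fullmatch(pattern, 'llm.model.layers.31.self_attn.v_proj')
# Layer 32 (out of range) and the vision tower do not:
assert not re.fullmatch(pattern, 'llm.model.layers.32.self_attn.q_proj')
assert not re.fullmatch(pattern, 'vpm.encoder.layers.0.self_attn.q_proj')
```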

@@ -5151,7 +5152,7 @@ def _new_forward(*args, **kwargs) -> Tensor:
@register_model(
    ModelType.minicpm_v_v2_5_chat,
    'OpenBMB/MiniCPM-Llama3-V-2_5',
-    LoRATM.llama,
+    LoRATM.minicpm_llama,
    TemplateType.minicpm_v_v2_5,
    support_flash_attn=True,
    requires=['timm'],
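Downstream, this regex string eventually reaches PEFT, whose `LoraConfig` accepts either a list of module-name suffixes or a single regex str. A minimal sketch of that hand-off, with placeholder hyperparameters rather than swift's defaults:

```python
from peft import LoraConfig

# Hyperparameter values here are placeholders, not swift's defaults.
config = LoraConfig(
    r=8,
    lora_alpha=32,
    # As a str, target_modules is applied by PEFT as a full-match regex,
    # so the LoRATM.minicpm_llama pattern can be passed through unchanged.
    target_modules=(r'.*model\.layers\.(?:[0-9]|[12][0-9]|3[01])'
                    r'\.(?:self_attn\.(?:q_proj|k_proj|v_proj))'),
)
```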