feat✨: 更新训练脚本以支持新的lora_target_modules和输出目录，优化训练配置

2025-05-30 19:14:34 +08:00
parent baccca420a
commit b84ebb03c7
2 changed files with 79 additions and 717 deletions
@@ -5,14 +5,14 @@ accelerate launch --config_file configs/accelerate_configs/deepspeed_zero1.yaml
    --use_peft \
    --peft_type MOELORA \
    --model_name_or_path Qwen/Qwen2.5-Omni-3B \
-    --lora_target_modules .*model\.layers.*proj \
+    --lora_target_modules .*model\.layers.*proj\|.*merger.*0\|.*merger.*1 \
    --lora_r 8 \
    --lora_alpha 32 \
    --per_device_train_batch_size 3 \
    --per_device_eval_batch_size 1 \
    --gradient_accumulation_steps 2 \
    --num_train_epochs 1 \
-    --output_dir checkpoint/qwen2_alllinear/ \
+    --output_dir checkpoint/qwen2_5omni_moelora/ \
    --learning_rate 2e-4 \
    --warmup_ratio 0.03 \
    --lr_scheduler_type cosine \
@@ -21,4 +21,4 @@ accelerate launch --config_file configs/accelerate_configs/deepspeed_zero1.yaml
    --logging_steps 10 \
    --gradient_checkpointing \
    --weight_decay 0.1 \
-    --resume_from_checkpoint /root/autodl-tmp/zhouyunyao/projects/CL-LMM/src/checkpoint/qwen2_alllinear/checkpoint-1000
+    # --resume_from_checkpoint /root/autodl-tmp/zhouyunyao/projects/CL-LMM/src/checkpoint/qwen2_alllinear/checkpoint-1000