qwen_train #2

Merged
alavi_team_user2 merged 4 commits from qwen_train into main 2025-11-23 10:54:27 +00:00
2 changed files with 4 additions and 1 deletion
Showing only changes of commit 7c945a1603 - Show all commits

1
.gitignore vendored
View File

@@ -8,3 +8,4 @@ models
*.log
research_notebook/data
train/qwen/output
train/qwen/mlruns

View File

@@ -3,6 +3,7 @@
nproc_per_node=1
MLFLOW_TRACKING_URI=http://0.0.0.0:5004 \
INFONCE_USE_BATCH=False \
CUDA_VISIBLE_DEVICES=0 \
NPROC_PER_NODE=$nproc_per_node \
@@ -30,4 +31,5 @@ swift sft \
--loss_type infonce \
--label_names labels \
--dataloader_drop_last true \
- --deepspeed zero3
+ --deepspeed zero3 \
+ --report_to mlflow