qwen_train #2
1
.gitignore
vendored
1
.gitignore
vendored
@ -8,3 +8,4 @@ models
|
|||||||
*.log
|
*.log
|
||||||
research_notebook/data
|
research_notebook/data
|
||||||
train/qwen/output
|
train/qwen/output
|
||||||
|
train/qwen/mlruns
|
||||||
|
|||||||
@ -3,6 +3,7 @@
|
|||||||
|
|
||||||
nproc_per_node=1
|
nproc_per_node=1
|
||||||
|
|
||||||
|
MLFLOW_TRACKING_URI=http://0.0.0.0:5004 \
|
||||||
INFONCE_USE_BATCH=False \
|
INFONCE_USE_BATCH=False \
|
||||||
CUDA_VISIBLE_DEVICES=0 \
|
CUDA_VISIBLE_DEVICES=0 \
|
||||||
NPROC_PER_NODE=$nproc_per_node \
|
NPROC_PER_NODE=$nproc_per_node \
|
||||||
@ -30,4 +31,5 @@ swift sft \
|
|||||||
--loss_type infonce \
|
--loss_type infonce \
|
||||||
--label_names labels \
|
--label_names labels \
|
||||||
--dataloader_drop_last true \
|
--dataloader_drop_last true \
|
||||||
--deepspeed zero3
|
--deepspeed zero3 \
|
||||||
|
--report_to mlflow
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user