from local

This commit is contained in:
dohe0342 2023-06-09 15:57:44 +09:00
parent 2c80a73107
commit 4dd1d20fd3

118
egs/tedlium3/ASR/lora.sh Executable file
View File

@ -0,0 +1,118 @@
# Usage: lora.sh <exp-name> <spk-id> [workstation]
#
#   $1  experiment sub-directory under ./pruned_transducer_stateless_d2v_v2/
#   $2  value forwarded to the training script as --spk-id
#   $3  workstation name (optional). "whale" launches prompt_tuning.py on
#       GPU 0 with --world-size 1; any other value, or none, launches
#       train_lora.py on GPUs 0-3 with --world-size 4.
#
# The launch is skipped when <exp-dir>/.train.done already exists. Nothing in
# this script creates that marker (the `touch` lines are disabled), so it only
# takes effect if the file is created by some other means.
#
# The script's exit status is the exit status of the training command.
recipe_dir=./pruned_transducer_stateless_d2v_v2
exp_dir="$recipe_dir/$1"
done_marker="$exp_dir/.train.done"

# Default to the empty string so that omitting the third argument selects the
# default branch without `[` reporting "unary operator expected".
workstation=${3:-}

if [ "$workstation" = "whale" ]; then
  #export CUDA_VISIBLE_DEVICES="0,1,2,3,4,5,6,7"
  export CUDA_VISIBLE_DEVICES=0
  if [ ! -e "$done_marker" ]; then
    # ${2:+"$2"} passes the speaker id as exactly one word (no splitting or
    # globbing) and, as before, passes no word at all when $2 is empty/unset.
    "$recipe_dir/prompt_tuning.py" \
      --num-buckets 2 \
      --add-adapter True \
      --adapter-lr 0.1 \
      --gender male \
      --wandb False \
      --input-strategy AudioSamples \
      --enable-spec-aug False \
      --multi-optim False \
      --world-size 1 \
      --num-epochs 10000 \
      --num-updates 101 \
      --save-every-n 50 \
      --full-libri 1 \
      --exp-dir "$exp_dir" \
      --max-duration 200 \
      --encoder-dim 768 \
      --decoder-dim 768 \
      --joiner-dim 768 \
      --use-fp16 0 \
      --accum-grads 8 \
      --encoder-type d2v \
      --additional-block True \
      --prune-range 10 \
      --prompt True \
      --spk-id ${2:+"$2"}
    #touch "$done_marker"
  fi
  # Disabled alternative: 8-process train_adapter.py run, kept for reference.
  # ./pruned_transducer_stateless_d2v_v2/train_adapter.py \
  #   --add-adapter True \
  #   --adapter-lr 0.001 \
  #   --gender female \
  #   --wandb False \
  #   --input-strategy AudioSamples \
  #   --enable-spec-aug False \
  #   --multi-optim False \
  #   --world-size 8 \
  #   --num-epochs 10 \
  #   --full-libri 1 \
  #   --exp-dir ./pruned_transducer_stateless_d2v_v2/$1 \
  #   --max-duration 200 \
  #   --use-fp16 0 \
  #   --encoder-type d2v \
  #   --additional-block True \
  #   --encoder-dim 768 \
  #   --decoder-dim 768 \
  #   --joiner-dim 768 \
  #   --prune-range 10
else
  export CUDA_VISIBLE_DEVICES="0,1,2,3"
  #rm "$done_marker"
  if [ ! -e "$done_marker" ]; then
    # --accum-grads used to be passed twice with the same value; it is now
    # passed once. See the note in the other branch about ${2:+"$2"}.
    "$recipe_dir/train_lora.py" \
      --num-buckets 2 \
      --add-adapter True \
      --adapter-lr 0.01 \
      --gender male \
      --wandb False \
      --input-strategy AudioSamples \
      --enable-spec-aug False \
      --multi-optim False \
      --world-size 4 \
      --num-epochs 10000 \
      --num-updates 101 \
      --save-every-n 50 \
      --full-libri 1 \
      --exp-dir "$exp_dir" \
      --max-duration 150 \
      --encoder-dim 768 \
      --decoder-dim 768 \
      --joiner-dim 768 \
      --use-fp16 0 \
      --accum-grads 2 \
      --encoder-type d2v \
      --additional-block True \
      --prune-range 10 \
      --spk-id ${2:+"$2"} \
      --prefix vox
    #touch "$done_marker"
  fi
fi
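# NOTE: everything from here to the end is a disabled train_adapter.py
# configuration kept for reference. It sits after the closing `fi`, so it
# cannot be re-enabled just by removing the leading `#` characters.
#else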
# export CUDA_VISIBLE_DEVICES="0,1,2,3"
# ./pruned_transducer_stateless_d2v_v2/train_adapter.py \
# --num-buckets 2 \
# --add-adapter True \
# --adapter-lr 0.02472 \
# --wandb False \
# --input-strategy AudioSamples \
# --enable-spec-aug False \
# --multi-optim False \
# --world-size 4 \
# --num-epochs 31 \
# --full-libri 1 \
# --exp-dir ./pruned_transducer_stateless_d2v_v2/$1 \
# --max-duration 150 \
# --encoder-dim 768 \
# --decoder-dim 768 \
# --joiner-dim 768 \
# --use-fp16 0 \
# --accum-grads 4 \
# --encoder-type d2v \
# --additional-block True \
# --prune-range 10 \
# --ctc-loss-scale 0.1924 \
# --lm-scale 0.1254 \
# --simple-loss-scale 0.2869 \
# --spk-id $2
#fi