From ec3366692c3c62cea3dca5ea2e6043a65df11a86 Mon Sep 17 00:00:00 2001
From: dohe0342
Date: Tue, 24 Jan 2023 13:58:40 +0900
Subject: [PATCH] from local

---
 egs/LJSpeech/ASR/.run_ad.swp    | Bin 4096 -> 0 bytes
 egs/LJSpeech/ASR/run_adapter.sh |  93 ++++++++++++++++++++++++++++++++
 2 files changed, 93 insertions(+)
 delete mode 100644 egs/LJSpeech/ASR/.run_ad.swp
 create mode 100755 egs/LJSpeech/ASR/run_adapter.sh

diff --git a/egs/LJSpeech/ASR/.run_ad.swp b/egs/LJSpeech/ASR/.run_ad.swp
deleted file mode 100644
index 4b86d1d3ee1f9bfe5e1fd2dd350dd445cf2b7258..0000000000000000000000000000000000000000
GIT binary patch
literal 0
HcmV?d00001

literal 4096
zcmYc?2=nw+u+%eP00IFJ0RauH3=Apx8L0-wCPpwZT(k>NU218ju5V(pQ+|GSKvBM4
zPJVJ?4!Zg}n1TA``9;~q1&PV2`kBe8X^A;G`l;!~`aWL41*xgY8TyXFLHb3ddGU!U
z=thk4M?+vV1jr5nUIt?$LvU7CR#H?D778WXq*0BdAut*OqaiRF0;3@?8UmvsFd71*
LAut*OLoWmX+A$(2

diff --git a/egs/LJSpeech/ASR/run_adapter.sh b/egs/LJSpeech/ASR/run_adapter.sh
new file mode 100755
index 000000000..ccfb8bd95
--- /dev/null
+++ b/egs/LJSpeech/ASR/run_adapter.sh
@@ -0,0 +1,93 @@
+#!/usr/bin/env bash
+#
+# Runs pruned_transducer_stateless_d2v_v2/train_adapter.py with one of two
+# hard-coded configurations, selected by the "workstation" variable below.
+#
+# Usage: ./run_adapter.sh <exp-name>
+#   <exp-name>  sub-directory of ./pruned_transducer_stateless_d2v_v2/ that is
+#               passed to the trainer as --exp-dir.
+#
+# Must be started from the directory that contains
+# pruned_transducer_stateless_d2v_v2/ (all paths are relative).
+
+# Without an experiment name --exp-dir would point at the source directory
+# itself, so refuse to run.
+exp_name="${1:?usage: $0 <exp-name>}"
+exp_dir="./pruned_transducer_stateless_d2v_v2/${exp_name}"
+
+# Refresh the checkout; a failed pull is reported but does not block the run.
+git pull || echo "warning: git pull failed; using the current checkout" >&2
+
+workstation="bear"
+
+if [[ "${workstation}" == "whale" ]]; then
+  export CUDA_VISIBLE_DEVICES="0,1,2,3,4,5,6,7"
+  ./pruned_transducer_stateless_d2v_v2/train_adapter.py \
+    --add-adapter True \
+    --adapter-lr 0.001 \
+    --gender male \
+    --wandb False \
+    --input-strategy AudioSamples \
+    --enable-spec-aug False \
+    --multi-optim False \
+    --world-size 8 \
+    --num-epochs 10 \
+    --full-libri 1 \
+    --exp-dir "${exp_dir}" \
+    --max-duration 200 \
+    --encoder-dim 768 \
+    --decoder-dim 768 \
+    --joiner-dim 768 \
+    --use-fp16 0 \
+    --accum-grads 1 \
+    --encoder-type d2v \
+    --additional-block True \
+    --prune-range 10
+
+  # Disabled alternative run with --gender female:
+#  ./pruned_transducer_stateless_d2v_v2/train_adapter.py \
+#    --add-adapter True \
+#    --adapter-lr 0.001 \
+#    --gender female \
+#    --wandb False \
+#    --input-strategy AudioSamples \
+#    --enable-spec-aug False \
+#    --multi-optim False \
+#    --world-size 8 \
+#    --num-epochs 10 \
+#    --full-libri 1 \
+#    --exp-dir "${exp_dir}" \
+#    --max-duration 200 \
+#    --use-fp16 0 \
+#    --encoder-type d2v \
+#    --additional-block True \
+#    --encoder-dim 768 \
+#    --decoder-dim 768 \
+#    --joiner-dim 768 \
+#    --prune-range 10
+else
+  export CUDA_VISIBLE_DEVICES="0,1,2,3"
+  ./pruned_transducer_stateless_d2v_v2/train_adapter.py \
+    --add-adapter True \
+    --adapter-lr 0.02472 \
+    --gender male \
+    --wandb True \
+    --input-strategy AudioSamples \
+    --enable-spec-aug False \
+    --multi-optim False \
+    --world-size 4 \
+    --num-epochs 10 \
+    --full-libri 1 \
+    --exp-dir "${exp_dir}" \
+    --max-duration 150 \
+    --encoder-dim 768 \
+    --decoder-dim 768 \
+    --joiner-dim 768 \
+    --use-fp16 0 \
+    --accum-grads 4 \
+    --encoder-type d2v \
+    --additional-block True \
+    --prune-range 10 \
+    --ctc-loss-scale 0.1924 \
+    --lm-scale 0.1254 \
+    --simple-loss-scale 0.2869
+fi