From 1e4f4ccb4787c2baf924a31fbec3f64413744658 Mon Sep 17 00:00:00 2001
From: dohe0342
Date: Tue, 24 Jan 2023 15:55:18 +0900
Subject: [PATCH] from local

---
Review notes (this area after the three-dash line is commentary and is not
applied with the patch):
  * run_v3.sh below was revised in review: interpreter line added, expansions
    quoted, the experiment name is now required, and the workstation can be
    given as an optional second argument (default "bear"). The train.py
    flags and their values are unchanged.
  * The "From" and "index" hashes are those of the original commit and do not
    describe the revised script.
  * egs/LJSpeech/ASR/.test.sh.swp looks like a Vim swap file; its binary
    delta is kept unchanged here, but consider dropping it from the commit.

 egs/LJSpeech/ASR/.test.sh.swp                 | Bin 12288 -> 12288 bytes
 .../run_v3.sh                                 |  76 +++++++++++++++++++
 2 files changed, 76 insertions(+)
 create mode 100755 egs/LJSpeech/ASR/pruned_transducer_stateless_d2v_v2/run_v3.sh

diff --git a/egs/LJSpeech/ASR/.test.sh.swp b/egs/LJSpeech/ASR/.test.sh.swp
index 2c798f8de14ed3044a44336db58297c9ae9c6e07..8f5eee277ac68654caaba3680ad5873a181b5a24 100644
GIT binary patch
delta 31
lcmZojXh;xCG6?hZRj|}EU;qLE28NsU=ab`;Hj2H{2LOl*2}b|`

delta 31
lcmZojXh;xCG6?hZRj|}EU;qLE1_tf=^U39j8^vDf0|0@_2(SPE

diff --git a/egs/LJSpeech/ASR/pruned_transducer_stateless_d2v_v2/run_v3.sh b/egs/LJSpeech/ASR/pruned_transducer_stateless_d2v_v2/run_v3.sh
new file mode 100755
index 000000000..90a639ed5
--- /dev/null
+++ b/egs/LJSpeech/ASR/pruned_transducer_stateless_d2v_v2/run_v3.sh
@@ -0,0 +1,76 @@
+#!/usr/bin/env bash
+#
+# Launch pruned_transducer_stateless_d2v_v2/train.py with one of two
+# workstation-specific argument sets.
+#
+# Usage: run_v3.sh <exp-name> [workstation]
+#   <exp-name>    appended to ./pruned_transducer_stateless_d2v_v2/ to form
+#                 the --exp-dir value
+#   [workstation] "whale" picks the 8-device argument set; anything else
+#                 (default "bear") picks the 4-device one
+#
+# All paths are relative: run from the directory that contains
+# pruned_transducer_stateless_d2v_v2/.
+
+# Stop early rather than pass train.py an --exp-dir ending in "/".
+exp_name="${1:?usage: $0 <exp-name> [workstation]}"
+workstation="${2:-bear}"
+
+# The pull's exit status is not checked, so a failed pull does not stop the run.
+git pull
+
+if [ "$workstation" = "whale" ]; then
+  export CUDA_VISIBLE_DEVICES="0,1,2,3,4,5,6,7"
+  ./pruned_transducer_stateless_d2v_v2/train.py \
+    --wandb true \
+    --input-strategy AudioSamples \
+    --enable-spec-aug False \
+    --multi-optim True \
+    --world-size 8 \
+    --num-epochs 30 \
+    --start-epoch 1 \
+    --full-libri 1 \
+    --exp-dir "./pruned_transducer_stateless_d2v_v2/${exp_name}" \
+    --max-duration 250 \
+    --freeze-finetune-updates 2000 \
+    --use-fp16 1 \
+    --peak-enc-lr 0.03 \
+    --peak-dec-lr 0.1 \
+    --accum-grads 1 \
+    --encoder-type d2v \
+    --additional-block True \
+    --encoder-dim 768 \
+    --decoder-dim 768 \
+    --joiner-dim 768 \
+    --prune-range 10 \
+    --context-size 2 \
+    --ctc-loss-scale 0.2
+else
+  # NOTE(review): --start-epoch 28 presumably resumes an earlier run in the
+  # same exp-dir; confirm before launching a fresh experiment.
+  export CUDA_VISIBLE_DEVICES="0,1,2,3"
+  ./pruned_transducer_stateless_d2v_v2/train.py \
+    --wandb False \
+    --input-strategy AudioSamples \
+    --enable-spec-aug False \
+    --multi-optim False \
+    --start-epoch 28 \
+    --world-size 4 \
+    --num-epochs 30 \
+    --full-libri 1 \
+    --exp-dir "./pruned_transducer_stateless_d2v_v2/${exp_name}" \
+    --max-duration 150 \
+    --freeze-finetune-updates 3000 \
+    --encoder-dim 768 \
+    --decoder-dim 768 \
+    --joiner-dim 768 \
+    --use-fp16 0 \
+    --peak-dec-lr 0.04175 \
+    --peak-enc-lr 0.0003859 \
+    --accum-grads 4 \
+    --encoder-type d2v \
+    --additional-block True \
+    --prune-range 10 \
+    --context-size 2 \
+    --ctc-loss-scale 0.2
+fi