diff --git a/egs/librispeech/ASR/.run_v2.sh.swp b/egs/librispeech/ASR/.run_v2.sh.swp index 57b240499..d7bfe9141 100644 Binary files a/egs/librispeech/ASR/.run_v2.sh.swp and b/egs/librispeech/ASR/.run_v2.sh.swp differ diff --git a/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/.data2vec_encoder.py.swp b/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/.data2vec_encoder.py.swp index 4aebbefce..d65d2ca3c 100644 Binary files a/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/.data2vec_encoder.py.swp and b/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/.data2vec_encoder.py.swp differ diff --git a/egs/librispeech/ASR/run_v2.sh b/egs/librispeech/ASR/run_v2.sh index f4dc74130..45bc87414 100755 --- a/egs/librispeech/ASR/run_v2.sh +++ b/egs/librispeech/ASR/run_v2.sh @@ -3,12 +3,14 @@ export CUDA_VISIBLE_DEVICES="0,1,2,3,4,5,6,7" git pull ./pruned_transducer_stateless_d2v_v2/train.py \ - --world-size 8 \ - --num-epochs 30 \ - --full-libri 1 \ - --use-fp16 1 \ - --max-duration 300 \ - --exp-dir pruned_transducer_stateless_d2v_v2/exp \ - --feedforward-dims "1024,1024,2048,2048,1024" \ - --ctc-loss-scale 0.2 \ - --master-port 12535 + --input-strategy AudioSamples \ + --enable-spec-aug False \ + --world-size 8 \ + --num-epochs 30 \ + --full-libri 1 \ + --use-fp16 1 \ + --max-duration 300 \ + --exp-dir pruned_transducer_stateless_d2v_v2/exp \ + --feedforward-dims "1024,1024,2048,2048,1024" \ + --ctc-loss-scale 0.2 \ + --master-port 12535