diff --git a/egs/aishell/ASR/zipformer/decode_bbpe.py b/egs/aishell/ASR/zipformer/decode_bbpe.py index afb18148a..1ec10b059 100755 --- a/egs/aishell/ASR/zipformer/decode_bbpe.py +++ b/egs/aishell/ASR/zipformer/decode_bbpe.py @@ -21,30 +21,33 @@ """ Usage: (1) greedy search -./zipformer_bbpe/decode.py \ +./zipformer/decode_bbpe.py \ --epoch 35 \ --avg 15 \ - --exp-dir ./zipformer_bbpe/exp \ - --lang-dir data/lang_char \ + --exp-dir ./zipformer/exp_bbpe \ + --lang-dir data/lang_bbpe_500 \ + --bpe-model data/lang_bbpe_500/bbpe.model \ --max-duration 600 \ --decoding-method greedy_search (2) modified beam search -./zipformer_bbpe/decode.py \ +./zipformer/decode_bbpe.py \ --epoch 35 \ --avg 15 \ - --exp-dir ./zipformer_bbpe/exp \ - --lang-dir data/lang_char \ + --exp-dir ./zipformer/exp_bbpe \ + --lang-dir data/lang_bbpe_500 \ + --bpe-model data/lang_bbpe_500/bbpe.model \ --max-duration 600 \ --decoding-method modified_beam_search \ --beam-size 4 (3) fast beam search (trivial_graph) -./zipformer_bbpe/decode.py \ +./zipformer/decode_bbpe.py \ --epoch 35 \ --avg 15 \ - --exp-dir ./zipformer_bbpe/exp \ - --lang-dir data/lang_char \ + --exp-dir ./zipformer/exp_bbpe \ + --lang-dir data/lang_bbpe_500 \ + --bpe-model data/lang_bbpe_500/bbpe.model \ --max-duration 600 \ --decoding-method fast_beam_search \ --beam 20.0 \ @@ -52,11 +55,12 @@ Usage: --max-states 64 (4) fast beam search (LG) -./zipformer_bbpe/decode.py \ +./zipformer/decode_bbpe.py \ --epoch 30 \ --avg 15 \ - --exp-dir ./zipformer_bbpe/exp \ - --lang-dir data/lang_char \ + --exp-dir ./zipformer/exp_bbpe \ + --lang-dir data/lang_bbpe_500 \ + --bpe-model data/lang_bbpe_500/bbpe.model \ --max-duration 600 \ --decoding-method fast_beam_search_LG \ --beam 20.0 \ @@ -64,11 +68,12 @@ Usage: --max-states 64 (5) fast beam search (nbest oracle WER) -./zipformer_bbpe/decode.py \ +./zipformer/decode_bbpe.py \ --epoch 35 \ --avg 15 \ - --exp-dir ./zipformer_bbpe/exp \ - --lang-dir data/lang_char \ + --exp-dir 
./zipformer/exp_bbpe \ + --lang-dir data/lang_bbpe_500 \ + --bpe-model data/lang_bbpe_500/bbpe.model \ --max-duration 600 \ --decoding-method fast_beam_search_nbest_oracle \ --beam 20.0 \ diff --git a/egs/aishell/ASR/zipformer/pretrained_bbpe.py b/egs/aishell/ASR/zipformer/pretrained_bbpe.py index ce4150cce..387bef98a 100755 --- a/egs/aishell/ASR/zipformer/pretrained_bbpe.py +++ b/egs/aishell/ASR/zipformer/pretrained_bbpe.py @@ -25,18 +25,18 @@ dataset, you should change the argument values according to your dataset. - For non-streaming model: -./zipformer_bbpe/export.py \ - --exp-dir ./zipformer_bbpe/exp \ - --bpe ./data/lang_bbpe_500/bbpe.model \ +./zipformer/export.py \ + --exp-dir ./zipformer/exp_bbpe \ + --tokens ./data/lang_bbpe_500/tokens.txt \ --epoch 30 \ --avg 9 - For streaming model: -./zipformer_bbpe/export.py \ - --exp-dir ./zipformer_bbpe/exp \ +./zipformer/export.py \ + --exp-dir ./zipformer/exp_bbpe \ --causal 1 \ - --bpe ./data/lang_bbpe_500/bbpe.model \ + --tokens ./data/lang_bbpe_500/tokens.txt \ --epoch 30 \ --avg 9 @@ -45,24 +45,24 @@ Usage of this script: - For non-streaming model: (1) greedy search -./zipformer_bbpe/pretrained.py \ - --checkpoint ./zipformer_bbpe/exp/pretrained.pt \ +./zipformer/pretrained_bbpe.py \ + --checkpoint ./zipformer/exp_bbpe/pretrained.pt \ --bpe ./data/lang_bbpe_500/bbpe.model \ --method greedy_search \ /path/to/foo.wav \ /path/to/bar.wav (2) modified beam search -./zipformer_bbpe/pretrained.py \ - --checkpoint ./zipformer_bbpe/exp/pretrained.pt \ +./zipformer/pretrained_bbpe.py \ + --checkpoint ./zipformer/exp_bbpe/pretrained.pt \ --bpe ./data/lang_bbpe_500/bbpe.model \ --method modified_beam_search \ /path/to/foo.wav \ /path/to/bar.wav (3) fast beam search -./zipformer_bbpe/pretrained.py \ - --checkpoint ./zipformer_bbpe/exp/pretrained.pt \ +./zipformer/pretrained_bbpe.py \ + --checkpoint ./zipformer/exp_bbpe/pretrained.pt \ --bpe ./data/lang_bbpe_500/bbpe.model \ --method fast_beam_search \ /path/to/foo.wav \ @@ 
-71,8 +71,8 @@ Usage of this script: - For streaming model: (1) greedy search -./zipformer_bbpe/pretrained.py \ - --checkpoint ./zipformer_bbpe/exp/pretrained.pt \ +./zipformer/pretrained_bbpe.py \ + --checkpoint ./zipformer/exp_bbpe/pretrained.pt \ --causal 1 \ --chunk-size 16 \ --left-context-frames 128 \ @@ -82,8 +82,8 @@ Usage of this script: /path/to/bar.wav (2) modified beam search -./zipformer_bbpe/pretrained.py \ - --checkpoint ./zipformer_bbpe/exp/pretrained.pt \ +./zipformer/pretrained_bbpe.py \ + --checkpoint ./zipformer/exp_bbpe/pretrained.pt \ --causal 1 \ --chunk-size 16 \ --left-context-frames 128 \ @@ -93,8 +93,8 @@ Usage of this script: /path/to/bar.wav (3) fast beam search -./zipformer_bbpe/pretrained.py \ - --checkpoint ./zipformer_bbpe/exp/pretrained.pt \ +./zipformer/pretrained_bbpe.py \ + --checkpoint ./zipformer/exp_bbpe/pretrained.pt \ --causal 1 \ --chunk-size 16 \ --left-context-frames 128 \ @@ -104,9 +104,9 @@ Usage of this script: /path/to/bar.wav -You can also use `./zipformer_bbpe/exp/epoch-xx.pt`. +You can also use `./zipformer/exp_bbpe/epoch-xx.pt`. 
-Note: ./zipformer_bbpe/exp/pretrained.pt is generated by ./zipformer_bbpe/export.py +Note: ./zipformer/exp_bbpe/pretrained.pt is generated by ./zipformer/export.py """ diff --git a/egs/aishell/ASR/zipformer/train_bbpe.py b/egs/aishell/ASR/zipformer/train_bbpe.py index 77354b7f3..a2bf96b29 100755 --- a/egs/aishell/ASR/zipformer/train_bbpe.py +++ b/egs/aishell/ASR/zipformer/train_bbpe.py @@ -24,25 +24,21 @@ Usage: export CUDA_VISIBLE_DEVICES="0,1,2,3,4,5,6,7" -./zipformer/train.py \ +./zipformer/train_bbpe.py \ --world-size 8 \ --num-epochs 12 \ --start-epoch 1 \ - --exp-dir zipformer/exp \ - --training-subset L - --lr-epochs 1.5 \ + --exp-dir zipformer/exp_bbpe \ --max-duration 350 # For mix precision training: -./zipformer/train.py \ +./zipformer/train_bbpe.py \ --world-size 8 \ --num-epochs 12 \ --start-epoch 1 \ --use-fp16 1 \ - --exp-dir zipformer/exp \ - --training-subset L \ - --lr-epochs 1.5 \ + --exp-dir zipformer/exp_bbpe \ --max-duration 750 """