From ca075f2c628f5908414dbe178b62cf97d0bd5cad Mon Sep 17 00:00:00 2001 From: JinZr <60612200+JinZr@users.noreply.github.com> Date: Sat, 2 Sep 2023 16:09:19 +0800 Subject: [PATCH] minor updates --- egs/multi_zh-hans/ASR/zipformer/export.py | 10 +++---- .../ASR/zipformer/multi_dataset.py | 28 +++++++++---------- 2 files changed, 19 insertions(+), 19 deletions(-) diff --git a/egs/multi_zh-hans/ASR/zipformer/export.py b/egs/multi_zh-hans/ASR/zipformer/export.py index 9dc7cf01a..723288191 100755 --- a/egs/multi_zh-hans/ASR/zipformer/export.py +++ b/egs/multi_zh-hans/ASR/zipformer/export.py @@ -34,7 +34,7 @@ dataset, you should change the argument values according to your dataset. ./zipformer/export.py \ --exp-dir ./zipformer/exp \ --tokens data/lang_bpe_2000/tokens.txt \ - --epoch 23 \ + --epoch 20 \ --avg 1 \ --jit 1 @@ -54,7 +54,7 @@ for how to use the exported models outside of icefall. --chunk-size 16 \ --left-context-frames 128 \ --tokens data/lang_bpe_2000/tokens.txt \ - --epoch 23 \ + --epoch 20 \ --avg 1 \ --jit 1 @@ -73,7 +73,7 @@ for how to use the exported models outside of icefall. ./zipformer/export.py \ --exp-dir ./zipformer/exp \ --tokens data/lang_bpe_2000/tokens.txt \ - --epoch 23 \ + --epoch 20 \ --avg 1 - For streaming model: @@ -82,7 +82,7 @@ for how to use the exported models outside of icefall. --exp-dir ./zipformer/exp \ --causal 1 \ --tokens data/lang_bpe_2000/tokens.txt \ - --epoch 23 \ + --epoch 20 \ --avg 1 It will generate a file `pretrained.pt` in the given `exp_dir`. You can later @@ -203,7 +203,7 @@ def get_parser(): parser.add_argument( "--epoch", type=int, - default=23, + default=20, help="""It specifies the checkpoint to use for decoding. Note: Epoch counts from 1. You can specify --avg to use more checkpoints for model averaging.""", diff --git a/egs/multi_zh-hans/ASR/zipformer/multi_dataset.py b/egs/multi_zh-hans/ASR/zipformer/multi_dataset.py index e239e1135..b1920e62e 100644 --- a/egs/multi_zh-hans/ASR/zipformer/multi_dataset.py +++ b/egs/multi_zh-hans/ASR/zipformer/multi_dataset.py @@ -283,17 +283,17 @@ class MultiDataset: self.fbank_dir / "kespeech" / "kespeech-asr_cuts_dev_phase2.jsonl.gz" ) - # # WeNetSpeech - # logging.info("Loading WeNetSpeech set in lazy mode") - # wenetspeech_test_meeting_cuts = load_manifest_lazy( - # self.fbank_dir / "wenetspeech" / "cuts_TEST_MEETING.jsonl.gz" - # ) - # wenetspeech_test_net_cuts = load_manifest_lazy( - # self.fbank_dir / "wenetspeech" / "cuts_TEST_NET.jsonl.gz" - # ) - # wenetspeech_dev_cuts = load_manifest_lazy( - # self.fbank_dir / "wenetspeech" / "cuts_DEV.jsonl.gz" - # ) + # WeNetSpeech + logging.info("Loading WeNetSpeech set in lazy mode") + wenetspeech_test_meeting_cuts = load_manifest_lazy( + self.fbank_dir / "wenetspeech" / "cuts_TEST_MEETING.jsonl.gz" + ) + wenetspeech_test_net_cuts = load_manifest_lazy( + self.fbank_dir / "wenetspeech" / "cuts_TEST_NET.jsonl.gz" + ) + wenetspeech_dev_cuts = load_manifest_lazy( + self.fbank_dir / "wenetspeech" / "cuts_DEV.jsonl.gz" + ) return { "aidatatang_test": aidatatang_test_cuts, @@ -310,7 +310,7 @@ class MultiDataset: "kespeech-asr_test": kespeech_test_cuts, "kespeech-asr_dev_phase1": kespeech_dev_phase1_cuts, "kespeech-asr_dev_phase2": kespeech_dev_phase2_cuts, - # "wenetspeech-meeting_test": wenetspeech_test_meeting_cuts, - # "wenetspeech-net_test": wenetspeech_test_net_cuts, - # "wenetspeech_dev": wenetspeech_dev_cuts, + "wenetspeech-meeting_test": wenetspeech_test_meeting_cuts, + "wenetspeech-net_test": wenetspeech_test_net_cuts, + "wenetspeech_dev": wenetspeech_dev_cuts, }