From 97868edfbb27976d5ddd340b743a61f124b43fbe Mon Sep 17 00:00:00 2001 From: rickychanhoyin Date: Fri, 19 Aug 2022 23:36:23 +0800 Subject: [PATCH 1/4] Update asr_datamodule.py minor file names correction --- egs/timit/ASR/tdnn_lstm_ctc/asr_datamodule.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/egs/timit/ASR/tdnn_lstm_ctc/asr_datamodule.py b/egs/timit/ASR/tdnn_lstm_ctc/asr_datamodule.py index 5e2923fb6..1554e987f 100644 --- a/egs/timit/ASR/tdnn_lstm_ctc/asr_datamodule.py +++ b/egs/timit/ASR/tdnn_lstm_ctc/asr_datamodule.py @@ -155,7 +155,7 @@ class TimitAsrDataModule(DataModule): logging.info("About to get Musan cuts") cuts_musan = load_manifest( - self.args.feature_dir / "cuts_musan.jsonl.gz" + self.args.feature_dir / "musan_cuts.jsonl.gz" ) logging.info("About to create train dataset") From 215c4bde1584fe80bed11be46b8103d431506188 Mon Sep 17 00:00:00 2001 From: rickychanhoyin Date: Sat, 27 Aug 2022 16:39:05 +0800 Subject: [PATCH 2/4] minor changes for correct path names && import module text2segments.py --- egs/alimeeting/ASR/local/compute_fbank_alimeeting.py | 2 +- egs/alimeeting/ASR/local/text2segments.py | 2 ++ egs/alimeeting/ASR/prepare.sh | 2 +- 3 files changed, 4 insertions(+), 2 deletions(-) diff --git a/egs/alimeeting/ASR/local/compute_fbank_alimeeting.py b/egs/alimeeting/ASR/local/compute_fbank_alimeeting.py index 2ff473c60..eb3acbbea 100755 --- a/egs/alimeeting/ASR/local/compute_fbank_alimeeting.py +++ b/egs/alimeeting/ASR/local/compute_fbank_alimeeting.py @@ -43,7 +43,7 @@ torch.set_num_interop_threads(1) def compute_fbank_alimeeting(num_mel_bins: int = 80): - src_dir = Path("data/manifests") + src_dir = Path("data/manifests/alimeeting") output_dir = Path("data/fbank") num_jobs = min(15, os.cpu_count()) diff --git a/egs/alimeeting/ASR/local/text2segments.py b/egs/alimeeting/ASR/local/text2segments.py index 3df727c67..7c1019aa8 100644 --- a/egs/alimeeting/ASR/local/text2segments.py +++ b/egs/alimeeting/ASR/local/text2segments.py 
@@ -30,9 +30,11 @@ with word segmenting: import argparse +import paddle import jieba from tqdm import tqdm +paddle.enable_static() jieba.enable_paddle() diff --git a/egs/alimeeting/ASR/prepare.sh b/egs/alimeeting/ASR/prepare.sh index eb2ac697d..17224bb68 100755 --- a/egs/alimeeting/ASR/prepare.sh +++ b/egs/alimeeting/ASR/prepare.sh @@ -107,7 +107,7 @@ if [ $stage -le 6 ] && [ $stop_stage -ge 6 ]; then # Prepare text. # Note: in Linux, you can install jq with the following command: # wget -O jq https://github.com/stedolan/jq/releases/download/jq-1.6/jq-linux64 - gunzip -c data/manifests/alimeeting/supervisions_train.jsonl.gz \ + gunzip -c data/manifests/alimeeting/alimeeting_supervisions_train.jsonl.gz \ | jq ".text" | sed 's/"//g' \ | ./local/text2token.py -t "char" > $lang_char_dir/text From 862e817442e658841443c0f6e232e1ad69582e4b Mon Sep 17 00:00:00 2001 From: rickychanhoyin Date: Wed, 31 Aug 2022 13:12:28 +0800 Subject: [PATCH 3/4] Very minor change in alimeeting recipe No need to load_audio. alimeeting audio data is wav format, default export_to_webdataset uses "flac". 
If load_audio is left at its default (True), webdataset reports "[Suppressed TypeError] Error message: save() got an unexpected keyword argument 'format'" during the write --- egs/alimeeting/ASR/pruned_transducer_stateless2/decode.py | 2 ++ 1 file changed, 2 insertions(+) diff --git a/egs/alimeeting/ASR/pruned_transducer_stateless2/decode.py b/egs/alimeeting/ASR/pruned_transducer_stateless2/decode.py index 65fc74728..9bd6c7df2 100755 --- a/egs/alimeeting/ASR/pruned_transducer_stateless2/decode.py +++ b/egs/alimeeting/ASR/pruned_transducer_stateless2/decode.py @@ -551,6 +551,7 @@ def main(): dev_cuts, output_path=f"{dev}/shared-%d.tar", shard_size=300, + load_audio=False, ) if not os.path.exists(f"{test}/shared-0.tar"): @@ -560,6 +561,7 @@ def main(): test_cuts, output_path=f"{test}/shared-%d.tar", shard_size=300, + load_audio=False, ) dev_shards = [ From fb90ada9e86084926f228eaeb8e41287c50fc1cf Mon Sep 17 00:00:00 2001 From: rickychanhoyin Date: Wed, 31 Aug 2022 13:45:35 +0800 Subject: [PATCH 4/4] remove trailing white space --- egs/alimeeting/ASR/pruned_transducer_stateless2/decode.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/egs/alimeeting/ASR/pruned_transducer_stateless2/decode.py b/egs/alimeeting/ASR/pruned_transducer_stateless2/decode.py index 9bd6c7df2..455652b65 100755 --- a/egs/alimeeting/ASR/pruned_transducer_stateless2/decode.py +++ b/egs/alimeeting/ASR/pruned_transducer_stateless2/decode.py @@ -551,7 +551,7 @@ def main(): dev_cuts, output_path=f"{dev}/shared-%d.tar", shard_size=300, - load_audio=False, + load_audio=False, ) if not os.path.exists(f"{test}/shared-0.tar"):