From 2636a3dd58301191af0a5bca06088544e91c450c Mon Sep 17 00:00:00 2001 From: rickychanhoyin Date: Sat, 27 Aug 2022 17:23:45 +0800 Subject: [PATCH] minor changes for correct path names && import module text2segments.py (#552) * Update asr_datamodule.py minor file names correction * minor changes for correct path names && import module text2segments.py --- egs/alimeeting/ASR/local/compute_fbank_alimeeting.py | 2 +- egs/alimeeting/ASR/local/text2segments.py | 2 ++ egs/alimeeting/ASR/prepare.sh | 2 +- 3 files changed, 4 insertions(+), 2 deletions(-) diff --git a/egs/alimeeting/ASR/local/compute_fbank_alimeeting.py b/egs/alimeeting/ASR/local/compute_fbank_alimeeting.py index 2ff473c60..eb3acbbea 100755 --- a/egs/alimeeting/ASR/local/compute_fbank_alimeeting.py +++ b/egs/alimeeting/ASR/local/compute_fbank_alimeeting.py @@ -43,7 +43,7 @@ torch.set_num_interop_threads(1) def compute_fbank_alimeeting(num_mel_bins: int = 80): - src_dir = Path("data/manifests") + src_dir = Path("data/manifests/alimeeting") output_dir = Path("data/fbank") num_jobs = min(15, os.cpu_count()) diff --git a/egs/alimeeting/ASR/local/text2segments.py b/egs/alimeeting/ASR/local/text2segments.py index 3df727c67..7c1019aa8 100644 --- a/egs/alimeeting/ASR/local/text2segments.py +++ b/egs/alimeeting/ASR/local/text2segments.py @@ -30,9 +30,11 @@ with word segmenting: import argparse +import paddle import jieba from tqdm import tqdm +paddle.enable_static() jieba.enable_paddle() diff --git a/egs/alimeeting/ASR/prepare.sh b/egs/alimeeting/ASR/prepare.sh index eb2ac697d..17224bb68 100755 --- a/egs/alimeeting/ASR/prepare.sh +++ b/egs/alimeeting/ASR/prepare.sh @@ -107,7 +107,7 @@ if [ $stage -le 6 ] && [ $stop_stage -ge 6 ]; then # Prepare text. # Note: in Linux, you can install jq with the following command: # wget -O jq https://github.com/stedolan/jq/releases/download/jq-1.6/jq-linux64 - gunzip -c data/manifests/alimeeting/supervisions_train.jsonl.gz \ + gunzip -c data/manifests/alimeeting/alimeeting_supervisions_train.jsonl.gz \ | jq ".text" | sed 's/"//g' \ | ./local/text2token.py -t "char" > $lang_char_dir/text