mirror of
https://github.com/k2-fsa/icefall.git
synced 2025-08-09 01:52:41 +00:00
Minor bug fixes and descriptive text for the LibriCSS recipe (#1268)
This commit is contained in:
parent
162ceaf4b3
commit
eeeeef390b
@ -90,6 +90,14 @@ if [ $stage -le 1 ] && [ $stop_stage -ge 1 ]; then
|
|||||||
# NOTE: Alignments are required for this recipe.
|
# NOTE: Alignments are required for this recipe.
|
||||||
mkdir -p data/manifests
|
mkdir -p data/manifests
|
||||||
|
|
||||||
|
log "This recipe uses mfa alignment for trimming"
|
||||||
|
if [ ! -d $dl_dir/libri_alignments/LibriSpeech ]; then
|
||||||
|
log "No alignment provided. please refer to ../../librispeech/ASR/add_alignments.sh \n \
|
||||||
|
for mfa alignments. Once you have downloaded and unzipped the .zip file containing \n \
|
||||||
|
all alignments, the folder should be renamed to libri_alignments and moved to your $dl_dir ."
|
||||||
|
exit 0
|
||||||
|
fi
|
||||||
|
|
||||||
lhotse prepare librispeech -p train-clean-100 -p train-clean-360 -p train-other-500 -p dev-clean \
|
lhotse prepare librispeech -p train-clean-100 -p train-clean-360 -p train-other-500 -p dev-clean \
|
||||||
-j 4 --alignments-dir $dl_dir/libri_alignments/LibriSpeech $dl_dir/librispeech data/manifests/
|
-j 4 --alignments-dir $dl_dir/libri_alignments/LibriSpeech $dl_dir/librispeech data/manifests/
|
||||||
fi
|
fi
|
||||||
@ -118,9 +126,12 @@ fi
|
|||||||
|
|
||||||
if [ $stage -le 4 ] && [ $stop_stage -ge 4 ]; then
|
if [ $stage -le 4 ] && [ $stop_stage -ge 4 ]; then
|
||||||
log "Stage 4: Extract features for LibriSpeech, trim to alignments, and shuffle the cuts"
|
log "Stage 4: Extract features for LibriSpeech, trim to alignments, and shuffle the cuts"
|
||||||
python local/compute_fbank_librispeech.py
|
# python local/compute_fbank_librispeech.py
|
||||||
lhotse combine data/manifests/librispeech_cuts_train* - |\
|
lhotse combine data/manifests/librispeech_cuts_train* data/manifests/librispeech_cuts_train_all.jsonl.gz
|
||||||
lhotse cut trim-to-alignments --type word --max-pause 0.2 - - |\
|
lhotse cut trim-to-alignments --type word --max-pause 0.2 \
|
||||||
|
data/manifests/librispeech_cuts_train_all.jsonl.gz \
|
||||||
|
data/manifests/librispeech_cuts_train_all_trimmed.jsonl.gz
|
||||||
|
cat <(gunzip -c data/manifests/librispeech_cuts_train_all_trimmed.jsonl.gz) | \
|
||||||
shuf | gzip -c > data/manifests/librispeech_cuts_train_trimmed.jsonl.gz
|
shuf | gzip -c > data/manifests/librispeech_cuts_train_trimmed.jsonl.gz
|
||||||
fi
|
fi
|
||||||
|
|
||||||
@ -152,7 +163,7 @@ if [ $stage -le 5 ] && [ $stop_stage -ge 5 ]; then
|
|||||||
data/manifests/lsmix_cuts_train_clean_ov40.jsonl.gz
|
data/manifests/lsmix_cuts_train_clean_ov40.jsonl.gz
|
||||||
|
|
||||||
# Full training set (2,3 speakers) anechoic
|
# Full training set (2,3 speakers) anechoic
|
||||||
log "Generating anechoic ${part} set (full)"
|
log "Generating anechoic set (full)"
|
||||||
lhotse workflows simulate-meetings \
|
lhotse workflows simulate-meetings \
|
||||||
--method conversational \
|
--method conversational \
|
||||||
--fit-to-supervisions data/manifests/libricss-sdm_supervisions_all_v1.jsonl.gz \
|
--fit-to-supervisions data/manifests/libricss-sdm_supervisions_all_v1.jsonl.gz \
|
||||||
|
Loading…
x
Reference in New Issue
Block a user