mirror of
https://github.com/k2-fsa/icefall.git
synced 2025-08-26 10:16:14 +00:00
minor updates
This commit is contained in:
parent
32a7d2222d
commit
f0744877a6
1
egs/libritts/ASR/local/compile_hlg.py
Symbolic link
1
egs/libritts/ASR/local/compile_hlg.py
Symbolic link
@ -0,0 +1 @@
|
|||||||
|
../../../librispeech/ASR/local/compile_hlg.py
|
1
egs/libritts/ASR/local/compile_lg.py
Symbolic link
1
egs/libritts/ASR/local/compile_lg.py
Symbolic link
@ -0,0 +1 @@
|
|||||||
|
../../../librispeech/ASR/local/compile_lg.py
|
@ -126,25 +126,25 @@ fi
|
|||||||
if [ $stage -le 5 ] && [ $stop_stage -ge 5 ]; then
|
if [ $stage -le 5 ] && [ $stop_stage -ge 5 ]; then
|
||||||
log "Stage 5: Train BPE model for normalized text"
|
log "Stage 5: Train BPE model for normalized text"
|
||||||
|
|
||||||
if [ ! -f data/texts ]; then
|
if [ ! -f data/text ]; then
|
||||||
gunzip -c data/manifests/libritts_supervisions_train-clean-100.jsonl.gz \
|
gunzip -c data/manifests/libritts_supervisions_train-clean-100.jsonl.gz \
|
||||||
| jq ".text" | sed 's/"//g' \
|
| jq ".text" | sed 's/"//g' \
|
||||||
| ./local/norm_text.py > data/texts
|
| ./local/norm_text.py > data/text
|
||||||
|
|
||||||
gunzip -c data/manifests/libritts_supervisions_train-clean-360.jsonl.gz \
|
gunzip -c data/manifests/libritts_supervisions_train-clean-360.jsonl.gz \
|
||||||
| jq ".text" | sed 's/"//g' \
|
| jq ".text" | sed 's/"//g' \
|
||||||
| ./local/norm_text.py >> data/texts
|
| ./local/norm_text.py >> data/text
|
||||||
|
|
||||||
gunzip -c data/manifests/libritts_supervisions_train-other-500.jsonl.gz \
|
gunzip -c data/manifests/libritts_supervisions_train-other-500.jsonl.gz \
|
||||||
| jq ".text" | sed 's/"//g' \
|
| jq ".text" | sed 's/"//g' \
|
||||||
| ./local/norm_text.py >> data/texts
|
| ./local/norm_text.py >> data/text
|
||||||
fi
|
fi
|
||||||
|
|
||||||
for vocab_size in ${vocab_sizes[@]}; do
|
for vocab_size in ${vocab_sizes[@]}; do
|
||||||
lang_dir=data/lang_bpe_${vocab_size}
|
lang_dir=data/lang_bpe_${vocab_size}
|
||||||
mkdir -p $lang_dir
|
mkdir -p $lang_dir
|
||||||
|
|
||||||
cp data/texts $lang_dir/text
|
cp data/text $lang_dir/text
|
||||||
|
|
||||||
if [ ! -f $lang_dir/bpe.model ]; then
|
if [ ! -f $lang_dir/bpe.model ]; then
|
||||||
./local/train_bpe_model.py \
|
./local/train_bpe_model.py \
|
||||||
|
1
egs/libritts/ASR/zipformer/decoder.py
Symbolic link
1
egs/libritts/ASR/zipformer/decoder.py
Symbolic link
@ -0,0 +1 @@
|
|||||||
|
../../../librispeech/ASR/zipformer/decoder.py
|
@ -1351,8 +1351,8 @@ def run(rank, world_size, args):
|
|||||||
|
|
||||||
return True
|
return True
|
||||||
|
|
||||||
train_cuts = train_cuts.filter(remove_short_and_long_utt)
|
|
||||||
train_cuts = train_cuts.map(normalize_text)
|
train_cuts = train_cuts.map(normalize_text)
|
||||||
|
train_cuts = train_cuts.filter(remove_short_and_long_utt)
|
||||||
|
|
||||||
if params.start_batch > 0 and checkpoints and "sampler" in checkpoints:
|
if params.start_batch > 0 and checkpoints and "sampler" in checkpoints:
|
||||||
# We only load the sampler's state dict when it loads a checkpoint
|
# We only load the sampler's state dict when it loads a checkpoint
|
||||||
|
Loading…
x
Reference in New Issue
Block a user