mirror of
https://github.com/k2-fsa/icefall.git
synced 2025-08-09 10:02:22 +00:00
* Add utility for shallow fusion
* test batch size == 1 without shallow fusion
* Use shallow fusion for modified-beam-search
* Modified beam search with ngram rescoring
* Fix code according to review

Co-authored-by: Fangjun Kuang <csukuangfj@gmail.com>
21 lines
533 B
Bash
Executable File
21 lines
533 B
Bash
Executable File
#!/usr/bin/env bash
#
# Generate n-gram language model files for orders 2, 3 and 5.
#
# For each order N this script:
#   1. runs ./shared/make_kn_lm.py on ${lang_dir}/transcript_tokens.txt to
#      write ${lang_dir}/Ngram.arpa;
#   2. runs `python3 -m kaldilm` on that ARPA file, using
#      ${lang_dir}/tokens.txt as the symbol table, and stores its stdout in
#      ${lang_dir}/Ngram.fst.txt.
#
# A step is skipped when its output file already exists.
#
# All paths are relative, so run this from the directory that contains
# ./shared and data/lang_bpe_500.

# Abort on the first failing command, unset variable, or failed pipeline stage
# so that a failed LM build is never followed by a conversion of a missing
# ARPA file.
set -euo pipefail

lang_dir=data/lang_bpe_500

for ngram in 2 3 5; do
  arpa="${lang_dir}/${ngram}gram.arpa"
  fst_txt="${lang_dir}/${ngram}gram.fst.txt"

  if [[ ! -f "${arpa}" ]]; then
    # NOTE(review): if make_kn_lm.py can leave a partial -lm file behind on
    # failure, delete it by hand before re-running; the check above would
    # otherwise skip this step.
    ./shared/make_kn_lm.py \
      -ngram-order "${ngram}" \
      -text "${lang_dir}/transcript_tokens.txt" \
      -lm "${arpa}"
  fi

  if [[ ! -f "${fst_txt}" ]]; then
    # The redirection creates its target before kaldilm starts. Write to a
    # temporary name and rename only on success, so a failed run cannot leave
    # an empty or truncated ${fst_txt} that later runs would accept as done.
    tmp_fst="${fst_txt}.tmp"
    if ! python3 -m kaldilm \
      --read-symbol-table="${lang_dir}/tokens.txt" \
      --disambig-symbol='#0' \
      --max-order="${ngram}" \
      "${arpa}" > "${tmp_fst}"; then
      rm -f -- "${tmp_fst}"
      printf 'error: kaldilm failed for %s\n' "${arpa}" >&2
      exit 1
    fi
    mv -- "${tmp_fst}" "${fst_txt}"
  fi
done