diff --git a/egs/tedlium2/ASR/conformer_ctc3/.train.py.swp b/egs/tedlium2/ASR/conformer_ctc3/.train.py.swp index ec4acc63d..7744b5032 100644 Binary files a/egs/tedlium2/ASR/conformer_ctc3/.train.py.swp and b/egs/tedlium2/ASR/conformer_ctc3/.train.py.swp differ diff --git a/egs/tedlium2/ASR/conformer_ctc3/train.py b/egs/tedlium2/ASR/conformer_ctc3/train.py index a6884896a..5cda80235 100755 --- a/egs/tedlium2/ASR/conformer_ctc3/train.py +++ b/egs/tedlium2/ASR/conformer_ctc3/train.py @@ -308,8 +308,6 @@ def get_parser() -> argparse.ArgumentParser: "--interctc-weight", type=float, default=0.3, - help="""Number of steps that affects how rapidly the learning rate - decreases. We suggest not to change this.""", ) add_model_arguments(parser) @@ -565,13 +563,13 @@ def compute_loss( allow_truncate=params.subsampling_factor - 1, ) - ctc_loss = 0.7* k2.ctc_loss( + ctc_loss = (1-params.interctc_weight)* k2.ctc_loss( decoding_graph=decoding_graph, dense_fsa_vec=dense_fsa_vec1, output_beam=params.beam_size, reduction=params.reduction, use_double_scores=params.use_double_scores, - ) + 0.3 * k2.ctc_loss( + ) + params.interctc_weight * k2.ctc_loss( decoding_graph=decoding_graph, dense_fsa_vec=dense_fsa_vec2, output_beam=params.beam_size,