diff --git a/egs/librispeech/ASR/transducer_stateless/conformer.py b/egs/librispeech/ASR/transducer_stateless/conformer.py index 7b9aff71f..fa25e6ca0 100644 --- a/egs/librispeech/ASR/transducer_stateless/conformer.py +++ b/egs/librispeech/ASR/transducer_stateless/conformer.py @@ -160,7 +160,7 @@ class ConformerEncoderLayer(nn.Module): nn.Linear(d_model, dim_feedforward), DerivBalancer(channel_dim=-1, threshold=0.05, max_factor=0.01), - SwishExpScale(dim_feedforward, speed=20.0, in_scale=0.5), + SwishExpScale(dim_feedforward, speed=20.0, in_scale=2.0), nn.Dropout(dropout), nn.Linear(dim_feedforward, d_model), ) @@ -169,7 +169,7 @@ class ConformerEncoderLayer(nn.Module): nn.Linear(d_model, dim_feedforward), DerivBalancer(channel_dim=-1, threshold=0.05, max_factor=0.01), - SwishExpScale(dim_feedforward, speed=20.0, in_scale=0.5), + SwishExpScale(dim_feedforward, speed=20.0, in_scale=2.0), nn.Dropout(dropout), nn.Linear(dim_feedforward, d_model), ) diff --git a/egs/librispeech/ASR/transducer_stateless/train.py b/egs/librispeech/ASR/transducer_stateless/train.py index 190406491..c72a9dd28 100755 --- a/egs/librispeech/ASR/transducer_stateless/train.py +++ b/egs/librispeech/ASR/transducer_stateless/train.py @@ -110,7 +110,7 @@ def get_parser(): parser.add_argument( "--exp-dir", type=str, - default="transducer_stateless/randcombine1_expscale3_rework_0.5", + default="transducer_stateless/randcombine1_expscale3_rework_2.0", help="""The experiment dir. It specifies the directory where all training related files, e.g., checkpoints, log, etc, are saved