From 7e889996413bc757c2cc7160c6e96644467ab57e Mon Sep 17 00:00:00 2001 From: Daniel Povey Date: Fri, 4 Mar 2022 14:31:29 +0800 Subject: [PATCH] Increase scale from 20 to 50. --- egs/librispeech/ASR/conformer_ctc/subsampling.py | 4 ++-- egs/librispeech/ASR/transducer_stateless/conformer.py | 4 ++-- egs/librispeech/ASR/transducer_stateless/train.py | 2 +- 3 files changed, 5 insertions(+), 5 deletions(-) diff --git a/egs/librispeech/ASR/conformer_ctc/subsampling.py b/egs/librispeech/ASR/conformer_ctc/subsampling.py index e38a94d09..97b9ae97b 100644 --- a/egs/librispeech/ASR/conformer_ctc/subsampling.py +++ b/egs/librispeech/ASR/conformer_ctc/subsampling.py @@ -48,12 +48,12 @@ class Conv2dSubsampling(nn.Module): in_channels=1, out_channels=odim, kernel_size=3, stride=2 ), nn.ReLU(), - ExpScale(odim, 1, 1, speed=20.0), + ExpScale(odim, 1, 1, speed=50.0), nn.Conv2d( in_channels=odim, out_channels=odim, kernel_size=3, stride=2 ), nn.ReLU(), - ExpScale(odim, 1, 1, speed=20.0), + ExpScale(odim, 1, 1, speed=50.0), ) self.out = nn.Linear(odim * (((idim - 1) // 2 - 1) // 2), odim) self.out_norm = nn.LayerNorm(odim, elementwise_affine=False) diff --git a/egs/librispeech/ASR/transducer_stateless/conformer.py b/egs/librispeech/ASR/transducer_stateless/conformer.py index 6907feb26..ef6b4ac97 100644 --- a/egs/librispeech/ASR/transducer_stateless/conformer.py +++ b/egs/librispeech/ASR/transducer_stateless/conformer.py @@ -156,7 +156,7 @@ class ConformerEncoderLayer(nn.Module): self.feed_forward = nn.Sequential( nn.Linear(d_model, dim_feedforward), - ExpScaleSwish(dim_feedforward, speed=20.0), + ExpScaleSwish(dim_feedforward, speed=50.0), nn.Dropout(dropout), nn.Linear(dim_feedforward, d_model), ) @@ -164,7 +164,7 @@ class ConformerEncoderLayer(nn.Module): self.feed_forward_macaron = nn.Sequential( nn.Linear(d_model, dim_feedforward), Swish(), - ExpScaleSwish(dim_feedforward, speed=20.0), + ExpScaleSwish(dim_feedforward, speed=50.0), nn.Dropout(dropout), nn.Linear(dim_feedforward, d_model), ) diff --git a/egs/librispeech/ASR/transducer_stateless/train.py b/egs/librispeech/ASR/transducer_stateless/train.py index c57968428..980633ed6 100755 --- a/egs/librispeech/ASR/transducer_stateless/train.py +++ b/egs/librispeech/ASR/transducer_stateless/train.py @@ -110,7 +110,7 @@ def get_parser(): parser.add_argument( "--exp-dir", type=str, - default="transducer_stateless/specaugmod_baseline_randcombine1_expscale3", + default="transducer_stateless/specaugmod_baseline_randcombine1_expscale4", help="""The experiment dir. It specifies the directory where all training related files, e.g., checkpoints, log, etc, are saved