Fix duplicate Swish; replace norm+swish with swish+exp-scale in convolution module

2025-12-11 06:55:27 +00:00 · 2022-03-04 15:50:51 +08:00 · 2022-03-04 15:50:51 +08:00 · 9cc5999829
commit 9cc5999829
parent 7e88999641
2 changed files with 4 additions and 7 deletions
--- a/egs/librispeech/ASR/transducer_stateless/conformer.py
+++ b/egs/librispeech/ASR/transducer_stateless/conformer.py
@@ -163,7 +163,6 @@ class ConformerEncoderLayer(nn.Module):
        self.feed_forward_macaron = nn.Sequential(
            nn.Linear(d_model, dim_feedforward),
-            Swish(),
            ExpScaleSwish(dim_feedforward, speed=50.0),
            nn.Dropout(dropout),
            nn.Linear(dim_feedforward, d_model),
@@ -874,7 +873,9 @@ class ConvolutionModule(nn.Module):
            groups=channels,
            bias=bias,
        )
-        self.norm = nn.LayerNorm(channels)
+        # shape: (channels, 1), broadcasts with (batch, channel, time).
+        self.activation = ExpScaleSwish(channels, 1, speed=50.0)
        self.pointwise_conv2 = nn.Conv1d(
            channels,
            channels,
@@ -883,7 +884,6 @@ class ConvolutionModule(nn.Module):
            padding=0,
            bias=bias,
        )
-        self.activation = Swish()
    def forward(self, x: Tensor) -> Tensor:
        """Compute convolution module.
@@ -905,9 +905,6 @@ class ConvolutionModule(nn.Module):
        # 1D Depthwise Conv
        x = self.depthwise_conv(x)
        # x is (batch, channels, time)
-        x = x.permute(0, 2, 1)
-        x = self.norm(x)
-        x = x.permute(0, 2, 1)
        x = self.activation(x)
--- a/egs/librispeech/ASR/transducer_stateless/train.py
+++ b/egs/librispeech/ASR/transducer_stateless/train.py
@@ -110,7 +110,7 @@ def get_parser():
    parser.add_argument(
        "--exp-dir",
        type=str,
-        default="transducer_stateless/specaugmod_baseline_randcombine1_expscale4",
+        default="transducer_stateless/specaugmod_baseline_randcombine1_expscale5",
        help="""The experiment dir.
        It specifies the directory where all training related
        files, e.g., checkpoints, log, etc, are saved