From 9a72567b7f8a03863afdafb2b862bfa709b38d44 Mon Sep 17 00:00:00 2001 From: Daniel Povey Date: Sat, 17 Dec 2022 21:57:21 +0800 Subject: [PATCH] Restore two nonlinearities. --- .../pruned_transducer_stateless7/zipformer.py | 21 +++++++++++++------ 1 file changed, 15 insertions(+), 6 deletions(-) diff --git a/egs/librispeech/ASR/pruned_transducer_stateless7/zipformer.py b/egs/librispeech/ASR/pruned_transducer_stateless7/zipformer.py index 75d24106a..6e938837d 100644 --- a/egs/librispeech/ASR/pruned_transducer_stateless7/zipformer.py +++ b/egs/librispeech/ASR/pruned_transducer_stateless7/zipformer.py @@ -1792,18 +1792,27 @@ class Conv2dSubsampling(nn.Module): stride=2, padding=0, ), + ActivationBalancer(layer2_channels, + channel_dim=1, + max_abs=4.0), + SwooshR(), ) self.convnext1 = nn.Sequential(ConvNeXt(layer2_channels), ConvNeXt(layer2_channels)) self.conv2 = nn.Sequential( - nn.Conv2d( - in_channels=layer2_channels, - out_channels=layer3_channels, - kernel_size=3, - stride=(1, 2), # (time, freq) - )) + nn.Conv2d( + in_channels=layer2_channels, + out_channels=layer3_channels, + kernel_size=3, + stride=(1, 2), # (time, freq) + ), + ActivationBalancer(layer3_channels, + channel_dim=1, + max_abs=4.0), + SwooshR(), + ) self.convnext2 = nn.Sequential(ConvNeXt(layer3_channels), ConvNeXt(layer3_channels))