From 4a4d12c9944b18d9e81e5af22c1dc835deab8586 Mon Sep 17 00:00:00 2001
From: Daniel Povey
Date: Sat, 31 Dec 2022 21:52:11 +0800
Subject: [PATCH] Revert kernel size of convnext2 from 5x5 to 7x7

---
 .../ASR/pruned_transducer_stateless7/zipformer.py | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/egs/librispeech/ASR/pruned_transducer_stateless7/zipformer.py b/egs/librispeech/ASR/pruned_transducer_stateless7/zipformer.py
index 4a946db5a..4e67ed35e 100644
--- a/egs/librispeech/ASR/pruned_transducer_stateless7/zipformer.py
+++ b/egs/librispeech/ASR/pruned_transducer_stateless7/zipformer.py
@@ -1869,9 +1869,9 @@ class Conv2dSubsampling(nn.Module):
             SwooshR(),
         )
 
-        self.convnext2 = nn.Sequential(ConvNeXt(layer3_channels, kernel_size=(5, 5)),
-                                       ConvNeXt(layer3_channels, kernel_size=(5, 5)),
-                                       ConvNeXt(layer3_channels, kernel_size=(5, 5)))
+        self.convnext2 = nn.Sequential(ConvNeXt(layer3_channels, kernel_size=(7, 7)),
+                                       ConvNeXt(layer3_channels, kernel_size=(7, 7)),
+                                       ConvNeXt(layer3_channels, kernel_size=(7, 7)))
 
         out_width = (((in_channels - 1) // 2) - 1) // 2