From 31f2f95f597f8758c5f338eb80fcef5a050fbdcd Mon Sep 17 00:00:00 2001 From: Daniel Povey Date: Fri, 9 Dec 2022 20:01:19 +0800 Subject: [PATCH 1/3] reduce min_abs of ff module from 1.0 to 0.75 --- egs/librispeech/ASR/pruned_transducer_stateless7/zipformer.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/egs/librispeech/ASR/pruned_transducer_stateless7/zipformer.py b/egs/librispeech/ASR/pruned_transducer_stateless7/zipformer.py index 315b10730..9403cc7d8 100644 --- a/egs/librispeech/ASR/pruned_transducer_stateless7/zipformer.py +++ b/egs/librispeech/ASR/pruned_transducer_stateless7/zipformer.py @@ -1437,7 +1437,7 @@ class FeedforwardModule(nn.Module): channel_dim=-1, min_positive=0.3, max_positive=1.0, - min_abs=1.0, + min_abs=0.75, max_abs=5.0, min_prob=0.25) self.activation = SwooshL() From a92df3e850f0c6cd1d40d3a63640bd7e13fae768 Mon Sep 17 00:00:00 2001 From: Daniel Povey Date: Fri, 9 Dec 2022 20:03:37 +0800 Subject: [PATCH 2/3] Reduce final min_abs on conv_module from 1.0 to 0.75. --- egs/librispeech/ASR/pruned_transducer_stateless7/zipformer.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/egs/librispeech/ASR/pruned_transducer_stateless7/zipformer.py b/egs/librispeech/ASR/pruned_transducer_stateless7/zipformer.py index 9403cc7d8..735f08d98 100644 --- a/egs/librispeech/ASR/pruned_transducer_stateless7/zipformer.py +++ b/egs/librispeech/ASR/pruned_transducer_stateless7/zipformer.py @@ -1633,7 +1633,7 @@ class ConvolutionModule(nn.Module): bottleneck_dim, channel_dim=1, min_positive=ScheduledFloat((0.0, 0.1), (8000.0, 0.05)), max_positive=1.0, - min_abs=ScheduledFloat((0.0, 0.2), (20000.0, 1.0)), + min_abs=ScheduledFloat((0.0, 0.2), (20000.0, 0.75)), max_abs=10.0, ) From a00ed7e976cf49cd47e80bffea5e140dbed229f4 Mon Sep 17 00:00:00 2001 From: Daniel Povey Date: Fri, 9 Dec 2022 20:05:50 +0800 Subject: [PATCH 3/3] Decrease min_abs of NonlinAttentionModule from 0.75 to 0.5; make its max_abs (not active) a constant. --- egs/librispeech/ASR/pruned_transducer_stateless7/zipformer.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/egs/librispeech/ASR/pruned_transducer_stateless7/zipformer.py b/egs/librispeech/ASR/pruned_transducer_stateless7/zipformer.py index 735f08d98..37be53c2a 100644 --- a/egs/librispeech/ASR/pruned_transducer_stateless7/zipformer.py +++ b/egs/librispeech/ASR/pruned_transducer_stateless7/zipformer.py @@ -1489,8 +1489,8 @@ class NonlinAttentionModule(nn.Module): hidden_channels, channel_dim=-1, min_positive=ScheduledFloat((0.0, 0.25), (20000.0, 0.05)), max_positive=ScheduledFloat((0.0, 0.75), (20000.0, 0.95)), - min_abs=0.75, - max_abs=ScheduledFloat((0.0, 2.5), (8000.0, 5.0), default=1.0), + min_abs=0.5, + max_abs=5.0, ) self.tanh = nn.Tanh()