From b7083e7aff86a618e46f95663489312355260ed8 Mon Sep 17 00:00:00 2001
From: Daniel Povey
Date: Sun, 23 Oct 2022 00:09:21 +0800
Subject: [PATCH] Increase default max_factor for ActivationBalancer from 0.02 to 0.04; decrease max_abs in ConvolutionModule.deriv_balancer2 from 100.0 to 20.0

---
 egs/librispeech/ASR/pruned_transducer_stateless7/conformer.py | 4 +++-
 egs/librispeech/ASR/pruned_transducer_stateless7/scaling.py | 2 +-
 2 files changed, 4 insertions(+), 2 deletions(-)

diff --git a/egs/librispeech/ASR/pruned_transducer_stateless7/conformer.py b/egs/librispeech/ASR/pruned_transducer_stateless7/conformer.py
index 35ae7624c..8734f266e 100644
--- a/egs/librispeech/ASR/pruned_transducer_stateless7/conformer.py
+++ b/egs/librispeech/ASR/pruned_transducer_stateless7/conformer.py
@@ -1334,7 +1334,9 @@ class ConvolutionModule(nn.Module):
         )
 
         self.deriv_balancer2 = ActivationBalancer(
-            channels, channel_dim=1, min_positive=0.05, max_positive=1.0
+            channels, channel_dim=1,
+            min_positive=0.05, max_positive=1.0,
+            max_abs=20.0,
         )
 
         self.activation = DoubleSwish()
diff --git a/egs/librispeech/ASR/pruned_transducer_stateless7/scaling.py b/egs/librispeech/ASR/pruned_transducer_stateless7/scaling.py
index 676110675..79ed592da 100644
--- a/egs/librispeech/ASR/pruned_transducer_stateless7/scaling.py
+++ b/egs/librispeech/ASR/pruned_transducer_stateless7/scaling.py
@@ -477,7 +477,7 @@ class ActivationBalancer(torch.nn.Module):
         channel_dim: int,
         min_positive: float = 0.05,
         max_positive: float = 0.95,
-        max_factor: float = 0.02,
+        max_factor: float = 0.04,
         sign_gain_factor: float = 0.01,
         scale_gain_factor: float = 0.02,
         min_abs: float = 0.2,