diff --git a/egs/librispeech/ASR/pruned_transducer_stateless7/conformer.py b/egs/librispeech/ASR/pruned_transducer_stateless7/conformer.py
index 35ae7624c..8734f266e 100644
--- a/egs/librispeech/ASR/pruned_transducer_stateless7/conformer.py
+++ b/egs/librispeech/ASR/pruned_transducer_stateless7/conformer.py
@@ -1334,7 +1334,9 @@ class ConvolutionModule(nn.Module):
         )
 
         self.deriv_balancer2 = ActivationBalancer(
-            channels, channel_dim=1, min_positive=0.05, max_positive=1.0
+            channels, channel_dim=1,
+            min_positive=0.05, max_positive=1.0,
+            max_abs=20.0,
         )
 
         self.activation = DoubleSwish()
diff --git a/egs/librispeech/ASR/pruned_transducer_stateless7/scaling.py b/egs/librispeech/ASR/pruned_transducer_stateless7/scaling.py
index 676110675..79ed592da 100644
--- a/egs/librispeech/ASR/pruned_transducer_stateless7/scaling.py
+++ b/egs/librispeech/ASR/pruned_transducer_stateless7/scaling.py
@@ -477,7 +477,7 @@ class ActivationBalancer(torch.nn.Module):
         channel_dim: int,
         min_positive: float = 0.05,
         max_positive: float = 0.95,
-        max_factor: float = 0.02,
+        max_factor: float = 0.04,
         sign_gain_factor: float = 0.01,
         scale_gain_factor: float = 0.02,
         min_abs: float = 0.2,