diff --git a/egs/libriheavy/LM/zipformer1/subformer.py b/egs/libriheavy/LM/zipformer1/subformer.py index c049ab898..6b92b5fc8 100644 --- a/egs/libriheavy/LM/zipformer1/subformer.py +++ b/egs/libriheavy/LM/zipformer1/subformer.py @@ -813,6 +813,7 @@ class LearnedDownsamplingModule(nn.Module): super().__init__() self.to_scores = nn.Linear(embed_dim, 1, bias=False) + self.to_scores.lr_factor = 0.5 # score_balancer is just to keep the magnitudes of the scores in # a fixed range and keep them balanced around zero, to stop # these drifting around. @@ -820,7 +821,8 @@ class LearnedDownsamplingModule(nn.Module): self.score_balancer = Balancer(1, channel_dim=-1, min_positive=1/(2*downsampling_factor), max_positive=0.6, - min_abs=1.0) + min_abs=1.0, + max_abs=4.0) # below are for diagnostics. self.copy_weights1 = nn.Identity()