Change to balancer2 schedule of NonlinAttentionModule, remove peak at 8k.

This commit is contained in:
Daniel Povey 2022-12-13 19:22:43 +08:00
parent 117d418e27
commit 52d18e405e

View File

@@ -1541,7 +1541,7 @@ class NonlinAttentionModule(nn.Module):
self.balancer2 = ActivationBalancer(
channels, channel_dim=-1,
min_positive=0.3, max_positive=0.7,
-min_abs=ScheduledFloat((0.0, 0.001), (8000.0, 0.01), (20000.0, 0.005)),
+min_abs=ScheduledFloat((0.0, 0.001), (20000.0, 0.005)),
)