Increase ratio from 2.0 to 3.0 on 2 whitening schedules

This commit is contained in:
Daniel Povey 2022-12-13 22:50:21 +08:00
parent 22204450db
commit 48445f22e4

View File

@@ -1297,7 +1297,7 @@ class SelfAttention(nn.Module):
 initial_scale=0.05)
 self.whiten = Whiten(num_groups=1,
-whitening_limit=_whitening_schedule(7.5),
+whitening_limit=_whitening_schedule(7.5, ratio=3.0),
 prob=(0.025, 0.25),
 grad_scale=0.01)
@@ -1534,7 +1534,7 @@ class NonlinAttentionModule(nn.Module):
 grad_scale=0.01)
 self.whiten2 = Whiten(num_groups=1,
-whitening_limit=_whitening_schedule(5.0),
+whitening_limit=_whitening_schedule(5.0, ratio=3.0),
 prob=(0.025, 0.25),
 grad_scale=0.01)