Increase initial whitening target for self_attn from 2.0 to 3.0.

This commit is contained in:
Daniel Povey 2022-11-24 15:18:28 +08:00
parent 45069175d9
commit 0ac26f4234

View File

@@ -1055,7 +1055,7 @@ class RelPositionMultiheadAttentionWeights(nn.Module):
  initial_scale=query_head_dim**-0.25)
  self.whiten_keys = Whiten(num_groups=num_heads,
- whitening_limit=_whitening_schedule(2.0),
+ whitening_limit=_whitening_schedule(3.0),
  prob=(0.025, 0.25),
  grad_scale=0.025)