mirror of
https://github.com/k2-fsa/icefall.git
synced 2025-12-11 06:55:27 +00:00
Increase penalty cutoff in NonlinAttention to 40.
This commit is contained in:
parent 09294c0b51
commit d0309c3f3d
@@ -1758,7 +1758,7 @@ class NonlinAttention(nn.Module):
 
         # ensure the activations after multiplication don't get too large.
         self.hidden_penalty = AbsValuePenalizer(
-            limit=10.0, penalty=1.0e-04, prob=0.1)
+            limit=40.0, penalty=1.0e-04, prob=0.1)
 
         self.out_proj = ScaledLinear(hidden_channels, channels,
                                      bias=True,
Loading…
x
Reference in New Issue
Block a user