mirror of
https://github.com/k2-fsa/icefall.git
synced 2025-09-19 05:54:20 +00:00
Restoring min_abs and max_abs defaults for the linear_pos proj.
This commit is contained in:
parent
a55f8c9c14
commit
e1182da6ac
@@ -468,8 +468,7 @@ class RelPositionMultiheadAttention(nn.Module):
|
|||||||
|
|
||||||
self.in_proj = nn.Linear(embed_dim, 3 * embed_dim, bias=True)
|
self.in_proj = nn.Linear(embed_dim, 3 * embed_dim, bias=True)
|
||||||
self.in_balancer = ActivationBalancer(channel_dim=-1, max_abs=5.0)
|
self.in_balancer = ActivationBalancer(channel_dim=-1, max_abs=5.0)
|
||||||
self.proj_balancer = ActivationBalancer(channel_dim=-1, min_positive=0.0,
|
self.proj_balancer = ActivationBalancer(channel_dim=-1, max_abs=10.0)
|
||||||
max_positive=1.0, max_abs=10.0)
|
|
||||||
self.out_proj = ScaledLinear(
|
self.out_proj = ScaledLinear(
|
||||||
embed_dim, embed_dim, bias=True, initial_scale=0.5
|
embed_dim, embed_dim, bias=True, initial_scale=0.5
|
||||||
)
|
)
|
||||||
|
Loading…
x
Reference in New Issue
Block a user