mirror of
https://github.com/k2-fsa/icefall.git
synced 2025-09-18 21:44:18 +00:00
Adding max_abs=3.0 to ActivationBalancer modules inside feedforward modules.
This commit is contained in:
parent
23e6d2e6d8
commit
de1fd91435
@@ -176,7 +176,7 @@ class ConformerEncoderLayer(nn.Module):
|
||||
|
||||
self.feed_forward = nn.Sequential(
|
||||
nn.Linear(d_model, dim_feedforward),
|
||||
- ActivationBalancer(channel_dim=-1),
|
||||
+ ActivationBalancer(channel_dim=-1, max_abs=3.0),
|
||||
DoubleSwish(),
|
||||
nn.Dropout(dropout),
|
||||
ScaledLinear(dim_feedforward, d_model,
|
||||
@@ -185,7 +185,7 @@ class ConformerEncoderLayer(nn.Module):
|
||||
|
||||
self.feed_forward_macaron = nn.Sequential(
|
||||
nn.Linear(d_model, dim_feedforward),
|
||||
- ActivationBalancer(channel_dim=-1),
|
||||
+ ActivationBalancer(channel_dim=-1, max_abs=3.0),
|
||||
DoubleSwish(),
|
||||
nn.Dropout(dropout),
|
||||
ScaledLinear(dim_feedforward, d_model,
|
||||
|
Loading…
x
Reference in New Issue
Block a user