mirror of
https://github.com/k2-fsa/icefall.git
synced 2025-12-11 06:55:27 +00:00
Make the in_proj of feedforward modules also be a LinearWithAuxLoss.
This commit is contained in:
parent
029f5869c4
commit
d9c7e4f216
@ -1384,7 +1384,9 @@ class FeedforwardModule(nn.Module):
|
|||||||
feedforward_dim: int,
|
feedforward_dim: int,
|
||||||
dropout: float):
|
dropout: float):
|
||||||
super(FeedforwardModule, self).__init__()
|
super(FeedforwardModule, self).__init__()
|
||||||
self.in_proj = nn.Linear(embed_dim, feedforward_dim)
|
self.in_proj = LinearWithAuxLoss(embed_dim, feedforward_dim,
|
||||||
|
aux_grad_scale=ScheduledFloat((0.0, 0.2), (1000.0, 0.01)))
|
||||||
|
|
||||||
self.hidden_balancer = ActivationBalancer(feedforward_dim,
|
self.hidden_balancer = ActivationBalancer(feedforward_dim,
|
||||||
channel_dim=-1, max_abs=10.0,
|
channel_dim=-1, max_abs=10.0,
|
||||||
min_prob=0.25)
|
min_prob=0.25)
|
||||||
@ -1392,8 +1394,7 @@ class FeedforwardModule(nn.Module):
|
|||||||
self.dropout = nn.Dropout(dropout)
|
self.dropout = nn.Dropout(dropout)
|
||||||
self.out_proj = LinearWithAuxLoss(feedforward_dim, embed_dim,
|
self.out_proj = LinearWithAuxLoss(feedforward_dim, embed_dim,
|
||||||
initial_scale=0.01,
|
initial_scale=0.01,
|
||||||
aux_grad_scale=ScheduledFloat((0.0, 0.2), (1000.0, 0.01)),
|
aux_grad_scale=ScheduledFloat((0.0, 0.2), (1000.0, 0.01)))
|
||||||
)
|
|
||||||
self.out_whiten = Whiten(num_groups=1,
|
self.out_whiten = Whiten(num_groups=1,
|
||||||
whitening_limit=_whitening_schedule(7.5),
|
whitening_limit=_whitening_schedule(7.5),
|
||||||
prob=(0.025, 0.25),
|
prob=(0.025, 0.25),
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user