mirror of
https://github.com/k2-fsa/icefall.git
synced 2025-12-11 06:55:27 +00:00
Change to schedule of bypass_scale min: make it larger, decrease slower.
This commit is contained in:
parent
efbb1d25c7
commit
b8db0f53f1
@ -371,9 +371,9 @@ class ZipformerEncoderLayer(nn.Module):
|
|||||||
# ensure we get grads if self.bypass_scale becomes out of range
|
# ensure we get grads if self.bypass_scale becomes out of range
|
||||||
return self.bypass_scale
|
return self.bypass_scale
|
||||||
# hardcode warmup period for bypass scale
|
# hardcode warmup period for bypass scale
|
||||||
warmup_period = 4000.0
|
warmup_period = 20000.0
|
||||||
initial_clamp_min = 0.5
|
initial_clamp_min = 1.0
|
||||||
final_clamp_min = 0.2
|
final_clamp_min = 0.3
|
||||||
if self.batch_count > warmup_period:
|
if self.batch_count > warmup_period:
|
||||||
clamp_min = final_clamp_min
|
clamp_min = final_clamp_min
|
||||||
else:
|
else:
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user