mirror of
https://github.com/k2-fsa/icefall.git
synced 2025-08-09 10:02:22 +00:00
Fix weight decay formula by adding 1/1-beta
This commit is contained in:
parent
2b0727a355
commit
47d49f29d7
@ -161,7 +161,7 @@ class Eve(Optimizer):
|
||||
#
|
||||
# Regarding the 1/1-beta factor below: this is to compensate for the deltas on successive
|
||||
# frames being correlated. I have to figure out the justification.
|
||||
weight_decay = (delta ** 2).mean() * (0.5 * (step_size / target_rms) ** 2 * (1.0 / (1.0 - beta)))
|
||||
weight_decay = (delta ** 2).mean() * (0.5 * (step_size / target_rms) ** 2 * (1.0 / (1.0 - beta1)))
|
||||
|
||||
p.mul_(1 - weight_decay)
|
||||
p.add_(delta, alpha=-step_size)
|
||||
|
Loading…
x
Reference in New Issue
Block a user