Fix the reverse_cutoff formula

This commit is contained in:
Daniel Povey 2022-06-25 18:24:05 +08:00
parent 8a0277d493
commit 0aa5a334d6

View File

@ -681,10 +681,10 @@ class NeutralGradient(Optimizer):
if size == 1:
continue
param_diag_var = param_diag_vars[dim]
- num_samples = (p.numel() // size) * 4 > size
+ num_samples = p.numel() // size
# don't apply this reverse_cutoff thing in situations where we can't get a reasonable estimate
# of param_cov even with stats accumulation, due to the shape of the tensor.
- reverse_cutoff = (param_reverse_cutoff if num_samples > size//4 else 1.0e+10)
+ reverse_cutoff = (param_reverse_cutoff if num_samples > size // 4 else 1.0e+10)
param_diag_var = self._smooth_param_diag_var(param_diag_var,
param_pow,
param_rel_eps,
@ -920,8 +920,6 @@ class NeutralGradient(Optimizer):
# S_sqrt is S.sqrt() in the limit where param_pow == 1.0,
# param_rel_eps=0, param_rel_max=inf
# don't apply this reverse_cutoff thing in situations where we can't get a reasonable estimate
# of param_cov even with stats accumulation, due to the shape of the tensor.
S_smoothed = self._smooth_param_diag_var(S, param_pow,
param_rel_eps, param_rel_max,
param_reverse_cutoff)