Make it use float16 if in amp but use clamp to avoid wrapping error

Daniel Povey 2022-10-23 21:13:23 +08:00
parent 85657946bb
commit d3876e32c4

@@ -922,8 +922,7 @@ class DoubleSwishFunction(torch.autograd.Function):
         if requires_grad:
             # discretize s. This should be expectation-preserving if we just divide the
             # result by 255.
-            s = s.to(torch.float)
-            s = ((s * 254.99) + torch.rand_like(s)).to(torch.uint8)
+            s = ((s * 255) + torch.rand_like(s)).clamp(max=255).to(torch.uint8)
             ctx.save_for_backward(s, y)
         return y
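
Below is a minimal sketch (not part of the commit) of the wrapping hazard the clamp guards against. Under AMP the sigmoid output s may be held in float16, and in float16 the sum s * 255 + torch.rand_like(s) can round up to exactly 256.0 when s is near 1.0; 256 does not fit in uint8, so the cast would wrap, whereas clamp(max=255) pins it to the top bucket first. The tensor values below are illustrative only.

import torch

# s at its maximum and a noise value chosen so the float16 sum rounds to 256.0.
s = torch.tensor([1.0], dtype=torch.float16)       # sigmoid output, in [0, 1]
noise = torch.tensor([0.97], dtype=torch.float16)  # stands in for torch.rand_like(s)

scaled = s * 255 + noise        # float16 rounding gives exactly 256.0 here
print(scaled)                   # tensor([256.], dtype=torch.float16)

# Casting 256.0 straight to uint8 would fall outside the representable range
# (the cast wraps or is undefined); clamping first keeps it at 255.
safe = scaled.clamp(max=255).to(torch.uint8)
print(safe)                     # tensor([255], dtype=torch.uint8)

# Dividing by 255 later recovers s in expectation, since the added uniform
# noise turns the truncating cast into unbiased stochastic rounding.
print(safe.to(torch.float16) / 255)

Compared with the previous workaround of scaling by 254.99, scaling by the full 255 keeps the whole [0, 255] quantization range usable and handles the overflow case explicitly with the clamp.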