Merge branch 'scaled_adam_exp151' into scaled_adam_exp150
commit f08a869769
@@ -255,10 +255,13 @@ class SoftmaxFunction(torch.autograd.Function):
     """
     @staticmethod
     def forward(ctx, x: Tensor, dim: int):
-        ans = x.softmax(dim=dim)
-        ctx.save_for_backward(ans)
-        ctx.dim = dim
-        return ans
+        with torch.cuda.amp.autocast(enabled=False):
+            if x.dtype == torch.float16:
+                x = x.to(torch.float32)
+            ans = x.softmax(dim=dim)
+            ctx.save_for_backward(ans)
+            ctx.dim = dim
+            return ans
 
     @staticmethod
     def backward(ctx, ans_grad: Tensor):
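For context: this change wraps SoftmaxFunction.forward in torch.cuda.amp.autocast(enabled=False) and upcasts float16 inputs to float32, so that under mixed-precision training the softmax, and the activations saved for backward, are computed in full precision. Below is a minimal, self-contained sketch of what the function might look like after this commit. The forward body mirrors the hunk above; the backward body is not part of this hunk, so the standard softmax gradient used there, and the small self-check at the bottom, are illustrative assumptions only, not the repository's actual code.

# Sketch only: forward follows the diff above; backward is an assumed standard
# softmax gradient, since the real backward body lies outside this hunk.
import torch
from torch import Tensor


class SoftmaxFunction(torch.autograd.Function):
    """Softmax computed in float32 even when autocast would run it in float16."""

    @staticmethod
    def forward(ctx, x: Tensor, dim: int):
        with torch.cuda.amp.autocast(enabled=False):
            # Under mixed precision the input may arrive as float16; upcast so
            # the softmax and the tensor saved for backward are full precision.
            if x.dtype == torch.float16:
                x = x.to(torch.float32)
            ans = x.softmax(dim=dim)
            ctx.save_for_backward(ans)
            ctx.dim = dim
            return ans

    @staticmethod
    def backward(ctx, ans_grad: Tensor):
        # Assumed standard softmax backward: grad_x = y * (grad_y - sum(grad_y * y)).
        (ans,) = ctx.saved_tensors
        with torch.cuda.amp.autocast(enabled=False):
            ans_grad = ans_grad.to(torch.float32)
            x_grad = ans_grad * ans
            x_grad = x_grad - ans * x_grad.sum(dim=ctx.dim, keepdim=True)
            return x_grad, None


if __name__ == "__main__":
    # Compare against torch.softmax's autograd gradient on a non-trivial loss.
    x = torch.randn(2, 5, requires_grad=True)
    x_ref = x.detach().clone().requires_grad_(True)
    w = torch.randn(2, 5)
    (SoftmaxFunction.apply(x, -1) * w).sum().backward()
    (torch.softmax(x_ref, dim=-1) * w).sum().backward()
    assert torch.allclose(x.grad, x_ref.grad, atol=1e-6)

Computing the softmax in float32 avoids the overflow and underflow that float16 exponentials can hit, at the cost of keeping the saved activation in float32.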