From d6aa386552505e4ceb7d1a03b38b9854974a88e7 Mon Sep 17 00:00:00 2001
From: Daniel Povey
Date: Sun, 23 Oct 2022 17:19:19 +0800
Subject: [PATCH] Fix randn to rand

---
 .../ASR/pruned_transducer_stateless7/scaling.py    | 10 ++++++----
 1 file changed, 6 insertions(+), 4 deletions(-)

diff --git a/egs/librispeech/ASR/pruned_transducer_stateless7/scaling.py b/egs/librispeech/ASR/pruned_transducer_stateless7/scaling.py
index e31548737..be6f94412 100644
--- a/egs/librispeech/ASR/pruned_transducer_stateless7/scaling.py
+++ b/egs/librispeech/ASR/pruned_transducer_stateless7/scaling.py
@@ -915,13 +915,15 @@ class DoubleSwishFunction(torch.autograd.Function):
 
     @staticmethod
     def forward(ctx, x: Tensor) -> Tensor:
+        requires_grad = x.requires_grad
         x = x.detach()
         s = torch.sigmoid(x - 1.0)
         y = x * s
-        # discretize s. This should be expectation-preserving if we just divide the
-        # result by 255.
-        s = ((s * 255) + torch.randn_like(s)).to(torch.uint8)
-        ctx.save_for_backward(s, y)
+        if requires_grad:
+            # discretize s. This should be expectation-preserving if we just divide the
+            # result by 255.
+            s = ((s * 255) + torch.rand_like(s)).to(torch.uint8)
+            ctx.save_for_backward(s, y)
         return y
 
     @staticmethod