From f9954263241973f07da3c790f48a8ef4edcd5889 Mon Sep 17 00:00:00 2001
From: Daniel Povey
Date: Sat, 29 Oct 2022 15:40:47 +0800
Subject: [PATCH] Reduce min of bypass_scale from 0.5 to 0.3, and make it not
 applied in test mode.

---
 .../ASR/pruned_transducer_stateless7/zipformer.py | 13 +++++++------
 1 file changed, 7 insertions(+), 6 deletions(-)

diff --git a/egs/librispeech/ASR/pruned_transducer_stateless7/zipformer.py b/egs/librispeech/ASR/pruned_transducer_stateless7/zipformer.py
index fd9a7cd8b..d06362c96 100644
--- a/egs/librispeech/ASR/pruned_transducer_stateless7/zipformer.py
+++ b/egs/librispeech/ASR/pruned_transducer_stateless7/zipformer.py
@@ -363,12 +363,13 @@ class ZipformerEncoderLayer(nn.Module):
         delta = src - src_orig
 
         bypass_scale = self.bypass_scale
-        if torch.jit.is_scripting() or (not self.training) or random.random() > 0.1:
-            # with probability 0.9, in training mode, or always, in testing
-            # mode, clamp bypass_scale to [ 0.1, 1.0 ]; this will encourage it
-            # to learn parameters within this range by making parameters that
-            # are outside that range range noisy.
-            bypass_scale = bypass_scale.clamp(min=0.5, max=1.0)
+        if self.training and random.random() > 0.1:
+            # with probability 0.9, in training mode, clamp bypass_scale to
+            # [0.3, 1.0]; this will encourage it to learn parameters within
+            # this range by making parameters that are outside that range
+            # noisy. For testing we don't bother, as it will anyway end up
+            # learning values within this range or very close to it.
+            bypass_scale = bypass_scale.clamp(min=0.3, max=1.0)
         src = src_orig + delta * bypass_scale
 
         return self.whiten(src)
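
Note: below is a minimal, self-contained sketch of the bypass-scale technique
this patch modifies, for sanity-checking the clamping behaviour outside the
full Zipformer. ToyBypassLayer, its nn.Linear body, the model dimension, and
the initial scale of 0.9 are illustrative assumptions and do not appear in the
patch; only the if/clamp logic mirrors the patched code.

import random

import torch
import torch.nn as nn


class ToyBypassLayer(nn.Module):
    """Toy layer that interpolates between its input and output with a
    learned per-layer scale on the layer's contribution (delta)."""

    def __init__(self, d_model: int = 8):
        super().__init__()
        # Hypothetical stand-in for the real encoder-layer body.
        self.linear = nn.Linear(d_model, d_model)
        # Learnable bypass scale; the initial value 0.9 is an assumption.
        self.bypass_scale = nn.Parameter(torch.full((1,), 0.9))

    def forward(self, src: torch.Tensor) -> torch.Tensor:
        src_orig = src
        src = self.linear(src)
        delta = src - src_orig

        bypass_scale = self.bypass_scale
        if self.training and random.random() > 0.1:
            # With probability 0.9 in training mode, clamp to [0.3, 1.0];
            # the unclamped 10% of steps make out-of-range values noisy,
            # which pushes the parameter to settle inside the range. At
            # test time the raw learned value is used, as in the patch.
            bypass_scale = bypass_scale.clamp(min=0.3, max=1.0)
        return src_orig + delta * bypass_scale


if __name__ == "__main__":
    layer = ToyBypassLayer()
    layer.train()  # stochastic clamping active with probability 0.9
    y_train = layer(torch.randn(2, 8))
    layer.eval()  # raw learned bypass_scale used, never clamped
    y_eval = layer(torch.randn(2, 8))
    print(y_train.shape, y_eval.shape)

Toggling train()/eval() shows why the patch drops the test-mode clamp: by the
end of training the parameter has been pushed into (or very close to) the
clamped range, so clamping at inference changes nothing.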