From 34c9261f62c847ac404678f08291d99b4cb8f856 Mon Sep 17 00:00:00 2001
From: danqing fu <danqing.fu@gmail.com>
Date: Tue, 6 Jun 2023 13:12:35 +0800
Subject: [PATCH] Call torch.jit.is_tracing() and clarify max_len comment

---
 egs/librispeech/ASR/zipformer/zipformer.py | 10 +++++-----
 1 file changed, 5 insertions(+), 5 deletions(-)

diff --git a/egs/librispeech/ASR/zipformer/zipformer.py b/egs/librispeech/ASR/zipformer/zipformer.py
index 85ebdb56e..660bdeb1d 100644
--- a/egs/librispeech/ASR/zipformer/zipformer.py
+++ b/egs/librispeech/ASR/zipformer/zipformer.py
@@ -1305,11 +1305,11 @@ class CompactRelPositionalEncoding(torch.nn.Module):
     ) -> None:
         """Construct a CompactRelPositionalEncoding object."""
         super(CompactRelPositionalEncoding, self).__init__()
-        if torch.jit.is_tracing:
-            # 10k frames correspond to ~100k ms, e.g., 100 seconds, i.e., 
-            # It assumes that the maximum input won't have more than 
-            # 10k frames. 
-            #
+        if torch.jit.is_tracing():
+            # Assume that the input, after downsampling, has no more than
+            # 10k frames.
+            # The first downsampling factor is 2, so the original input
+            # should have fewer than 20k frames, i.e., under 200 seconds (about 3.33 minutes).
             max_len = 10000
         self.embed_dim = embed_dim
         assert embed_dim % 2 == 0