From e73ced16073496fa24e4c5970fc4c1a29fc04455 Mon Sep 17 00:00:00 2001
From: Daniel Povey <dpovey@gmail.com>
Date: Thu, 17 Nov 2022 16:02:57 +0800
Subject: [PATCH] Bug fix in formula for pos embedding

---
 egs/librispeech/ASR/pruned_transducer_stateless7/zipformer.py | 3 +--
 1 file changed, 1 insertion(+), 2 deletions(-)

diff --git a/egs/librispeech/ASR/pruned_transducer_stateless7/zipformer.py b/egs/librispeech/ASR/pruned_transducer_stateless7/zipformer.py
index 0d275832b..4e7261fd0 100644
--- a/egs/librispeech/ASR/pruned_transducer_stateless7/zipformer.py
+++ b/egs/librispeech/ASR/pruned_transducer_stateless7/zipformer.py
@@ -932,8 +932,7 @@ class CompactRelPositionalEncoding(torch.nn.Module):
         # but it does so more slowly than T for large absolute values of T.
         # The formula is chosen so that d(x_compressed )/dx is 1 around x == 0, which
         # is important.
-        x_compressed = compression_length * x.sign() * (x.abs() + compression_length).log()
-
+        x_compressed = compression_length * x.sign() * ((x.abs() + compression_length).log() - math.log(compression_length))
 
         # length_factor is chosen so that the FFT can exactly separate points
         # close to the origin (T == 0).  So this part of the formulation is not really