From 5ed6fc0e6d9afeebaf86ec83c16d9ff2c8d6a0ba Mon Sep 17 00:00:00 2001
From: marcoyang1998 <45973641+marcoyang1998@users.noreply.github.com>
Date: Wed, 12 Jul 2023 15:37:14 +0800
Subject: [PATCH 1/2] add sym link (#1170)

---
 egs/wenetspeech/ASR/local/prepare_char_lm_training_data.py | 1 +
 egs/wenetspeech/ASR/local/sort_lm_training_data.py         | 1 +
 2 files changed, 2 insertions(+)
 create mode 120000 egs/wenetspeech/ASR/local/prepare_char_lm_training_data.py
 create mode 120000 egs/wenetspeech/ASR/local/sort_lm_training_data.py

diff --git a/egs/wenetspeech/ASR/local/prepare_char_lm_training_data.py b/egs/wenetspeech/ASR/local/prepare_char_lm_training_data.py
new file mode 120000
index 000000000..2374cafdd
--- /dev/null
+++ b/egs/wenetspeech/ASR/local/prepare_char_lm_training_data.py
@@ -0,0 +1 @@
+../../../aishell/ASR/local/prepare_char_lm_training_data.py
\ No newline at end of file
diff --git a/egs/wenetspeech/ASR/local/sort_lm_training_data.py b/egs/wenetspeech/ASR/local/sort_lm_training_data.py
new file mode 120000
index 000000000..efef2c445
--- /dev/null
+++ b/egs/wenetspeech/ASR/local/sort_lm_training_data.py
@@ -0,0 +1 @@
+../../../aishell/ASR/local/sort_lm_training_data.py
\ No newline at end of file

From 4ab7d610081c0c3b38dd851298cb45381e6ac591 Mon Sep 17 00:00:00 2001
From: zr_jin <60612200+JinZr@users.noreply.github.com>
Date: Sat, 15 Jul 2023 12:39:32 +0800
Subject: [PATCH 2/2] removed `batch_name` to fix a KeyError with "uttid" (#1172)

---
 egs/librispeech/ASR/conformer_ctc2/train.py | 11 ++---------
 1 file changed, 2 insertions(+), 9 deletions(-)

diff --git a/egs/librispeech/ASR/conformer_ctc2/train.py b/egs/librispeech/ASR/conformer_ctc2/train.py
index 3366af13e..c4a13b101 100755
--- a/egs/librispeech/ASR/conformer_ctc2/train.py
+++ b/egs/librispeech/ASR/conformer_ctc2/train.py
@@ -675,7 +675,6 @@ def train_one_epoch(
     for batch_idx, batch in enumerate(train_dl):
         params.batch_idx_train += 1
         batch_size = len(batch["supervisions"]["text"])
-        batch_name = batch["supervisions"]["uttid"]
 
         with torch.cuda.amp.autocast(enabled=params.use_fp16):
             loss, loss_info = compute_loss(
@@ -698,10 +697,7 @@ def train_one_epoch(
             scaler.scale(loss).backward()
         except RuntimeError as e:
             if "CUDA out of memory" in str(e):
-                logging.error(
-                    f"failing batch size:{batch_size} "
-                    f"failing batch names {batch_name}"
-                )
+                logging.error(f"failing batch size:{batch_size} ")
             raise
 
         scheduler.step_batch(params.batch_idx_train)
@@ -756,10 +752,7 @@ def train_one_epoch(
             if loss_info["ctc_loss"] == float("inf") or loss_info["att_loss"] == float(
                 "inf"
             ):
-                logging.error(
-                    "Your loss contains inf, something goes wrong"
-                    f"failing batch names {batch_name}"
-                )
+                logging.error("Your loss contains inf, something goes wrong")
             if tb_writer is not None:
                 tb_writer.add_scalar(
                     "train/learning_rate", cur_lr, params.batch_idx_train