Decrease the learning rate to fix the error: RuntimeError: grad_scale is too small, exiting: 5.820766091346741e-11

Triplecq 2024-01-14 12:12:15 -05:00
parent ced8a53cdc
commit 42c152f5cb

@@ -30,7 +30,6 @@ export CUDA_VISIBLE_DEVICES="0,1,2,3"
   --start-epoch 1 \
   --use-fp16 1 \
   --exp-dir zipformer/exp \
-  --full-libri 1 \
   --max-duration 1000
 
 # For streaming model training:
@@ -41,7 +40,6 @@ export CUDA_VISIBLE_DEVICES="0,1,2,3"
   --use-fp16 1 \
   --exp-dir zipformer/exp \
   --causal 1 \
-  --full-libri 1 \
   --max-duration 1000
 
 It supports training with:
@@ -330,7 +328,7 @@ def get_parser():
     )
     parser.add_argument(
-        "--base-lr", type=float, default=0.045, help="The base learning rate."
+        "--base-lr", type=float, default=0.035, help="The base learning rate."
     )
     parser.add_argument(
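
For context on why lowering --base-lr resolves this: with --use-fp16 1 the recipe trains under PyTorch automatic mixed precision, and GradScaler halves its loss scale (backoff_factor=0.5 by default) every time the gradients overflow to inf/NaN. A learning rate that is too aggressive keeps the loss diverging, so overflows repeat, the scale decays geometrically toward zero (hence a value like 5.8e-11), and training aborts with the RuntimeError quoted in the commit title rather than looping forever on skipped updates. Below is a minimal sketch of that mechanism, not icefall's actual train.py: check_grad_scale, its 1e-05 threshold, and the toy model/loop are illustrative assumptions, while GradScaler, get_scale(), scale(), step(), and update() are real PyTorch APIs.

# Minimal sketch of the fp16 grad-scale collapse, assuming PyTorch AMP.
# This is NOT icefall's code; `check_grad_scale` is a hypothetical helper
# mirroring the guard implied by the error message in the commit title.
import torch

def check_grad_scale(scaler: torch.cuda.amp.GradScaler) -> None:
    cur_grad_scale = scaler.get_scale()
    # Repeated inf/NaN gradients halve the scale each step; once it
    # underflows toward zero, no useful update can ever be applied.
    if cur_grad_scale < 1.0e-05:  # threshold is illustrative
        raise RuntimeError(f"grad_scale is too small, exiting: {cur_grad_scale}")

model = torch.nn.Linear(16, 1).cuda()
# The new default from this commit; 0.045 proved too aggressive here.
optimizer = torch.optim.SGD(model.parameters(), lr=0.035)
scaler = torch.cuda.amp.GradScaler()

for step in range(100):
    x = torch.randn(8, 16, device="cuda")
    optimizer.zero_grad()
    with torch.cuda.amp.autocast():
        loss = model(x).pow(2).mean()
    scaler.scale(loss).backward()  # backward pass on the scaled loss
    scaler.step(optimizer)         # silently skipped on inf/NaN grads
    scaler.update()                # scale *= 0.5 after an overflow
    check_grad_scale(scaler)       # fail fast instead of training on junk

With the base learning rate lowered from 0.045 to 0.035, overflows become rare enough that update() can grow the scale back (growth_factor=2.0 after every growth_interval=2000 clean steps by default) instead of letting it collapse to values like 5.8e-11.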