Use more attention heads in slowest layer.

Daniel Povey 2022-11-11 22:56:14 +08:00
parent f7aff4f507
commit 4988c815c9


@@ -127,7 +127,7 @@ def add_model_arguments(parser: argparse.ArgumentParser):
     parser.add_argument(
         "--num-heads",
         type=str,
-        default="8",
+        default="8,8,8,16,8,8",
         help="Number of attention heads in the zipformer encoder layers: a single int or comma-separated list.",
     )
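
As a minimal sketch of how a comma-separated "--num-heads" value like this could be expanded into one head count per zipformer encoder stack (parse_num_heads and num_stacks are hypothetical names for illustration, not the actual icefall helpers):

    # Hypothetical sketch: expand a "--num-heads" spec into per-stack values.
    def parse_num_heads(spec: str, num_stacks: int) -> tuple:
        values = tuple(int(v) for v in spec.split(","))
        if len(values) == 1:
            # A single int applies uniformly to every encoder stack.
            values = values * num_stacks
        assert len(values) == num_stacks, (
            f"expected 1 or {num_stacks} values, got {len(values)}"
        )
        return values

    # With the new default, the 4th stack (the most downsampled, i.e.
    # slowest frame rate) gets 16 heads while the others keep 8:
    print(parse_num_heads("8,8,8,16,8,8", num_stacks=6))
    # -> (8, 8, 8, 16, 8, 8)

Since the slowest stack runs at the lowest frame rate, giving it extra heads adds modeling capacity where the per-frame compute cost is cheapest.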