From f3b918452ac6b210c25651f974bc8e8141aff101 Mon Sep 17 00:00:00 2001 From: jinzr <60612200+JinZr@users.noreply.github.com> Date: Thu, 19 Oct 2023 11:09:20 +0800 Subject: [PATCH] arch align --- egs/ami/ASR/zipformer/train.py | 16 ++++++++-------- 1 file changed, 8 insertions(+), 8 deletions(-) diff --git a/egs/ami/ASR/zipformer/train.py b/egs/ami/ASR/zipformer/train.py index 7d42e87b4..6efa085c2 100755 --- a/egs/ami/ASR/zipformer/train.py +++ b/egs/ami/ASR/zipformer/train.py @@ -127,35 +127,35 @@ def add_model_arguments(parser: argparse.ArgumentParser): parser.add_argument( "--num-encoder-layers", type=str, - default="2,2,3,4,3,2", + default="2,4,3,2,4", help="Number of zipformer encoder layers per stack, comma separated.", ) parser.add_argument( "--downsampling-factor", type=str, - default="1,2,4,8,4,2", + default="1,2,4,8,2", help="Downsampling factor for each stack of encoder layers.", ) parser.add_argument( "--feedforward-dim", type=str, - default="512,768,1024,1536,1024,768", + default="1024,1024,2048,2048,1024", help="Feedforward dimension of the zipformer encoder layers, per stack, comma separated.", ) parser.add_argument( "--num-heads", type=str, - default="4,4,4,8,4,4", + default="8,8,8,8,8", help="Number of attention heads in the zipformer encoder layers: a single int or comma-separated list.", ) parser.add_argument( "--encoder-dim", type=str, - default="192,256,384,512,384,256", + default="384,384,384,384,384", help="Embedding dimension in encoder stacks: a single int or comma-separated list.", ) @@ -190,7 +190,7 @@ def add_model_arguments(parser: argparse.ArgumentParser): parser.add_argument( "--encoder-unmasked-dim", type=str, - default="192,192,256,256,256,192", + default="256,256,256,256,256", help="Unmasked dimensions in the encoders, relates to augmentation during training. " "A single int or comma-separated list. Must be <= each corresponding encoder_dim.", ) @@ -198,7 +198,7 @@ def add_model_arguments(parser: argparse.ArgumentParser): parser.add_argument( "--cnn-module-kernel", type=str, - default="31,31,15,15,15,31", + default="31,31,31,31,31", help="Sizes of convolutional kernels in convolution modules in each encoder stack: " "a single int or comma-separated list.", ) @@ -329,7 +329,7 @@ def get_parser(): ) parser.add_argument( - "--base-lr", type=float, default=0.045, help="The base learning rate." + "--base-lr", type=float, default=0.05, help="The base learning rate." ) parser.add_argument(