From 465d41c4299ba479eed867d7a943379ce4398c79 Mon Sep 17 00:00:00 2001 From: Daniel Povey Date: Tue, 16 May 2023 12:13:13 +0800 Subject: [PATCH] Increase model dimensions; reduce batch size from 18 to 16 --- egs/libriheavy/LM/zipformer1/train.py | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/egs/libriheavy/LM/zipformer1/train.py b/egs/libriheavy/LM/zipformer1/train.py index 89d54701b..fedd5b3d4 100755 --- a/egs/libriheavy/LM/zipformer1/train.py +++ b/egs/libriheavy/LM/zipformer1/train.py @@ -128,7 +128,7 @@ def add_model_arguments(parser: argparse.ArgumentParser): parser.add_argument( "--feedforward-dim", type=str, - default="512,768,1024,1536,1024,768,512", + default="768,1024,1536,2048,1536,1024,768", help="Feedforward dimension of the subformer encoder layers, per stack, comma separated.", ) @@ -142,7 +142,7 @@ def add_model_arguments(parser: argparse.ArgumentParser): parser.add_argument( "--encoder-dim", type=str, - default="256,256,384,512,384,256,256", + default="256,384,512,768,512,384,256", help="Embedding dimension in encoder stacks: a single int or comma-separated list." ) @@ -156,7 +156,7 @@ def add_model_arguments(parser: argparse.ArgumentParser): parser.add_argument( "--value-head-dim", type=str, - default="12", + default="16", help="Value dimension per head in encoder stacks: a single int or comma-separated list." ) @@ -437,7 +437,7 @@ def get_params() -> AttributeDict: "warm_step": 2000, "env_info": get_env_info(), "bytes_per_segment": 2048, - "batch_size": 18, + "batch_size": 16, "train_file_list": "train.txt", "valid_file_list": "valid.txt", "num_workers": 4,