diff --git a/egs/librispeech/ASR/pruned_transducer_stateless4/train.py b/egs/librispeech/ASR/pruned_transducer_stateless4/train.py index 5d9683d54..a047c2045 100755 --- a/egs/librispeech/ASR/pruned_transducer_stateless4/train.py +++ b/egs/librispeech/ASR/pruned_transducer_stateless4/train.py @@ -872,7 +872,8 @@ def run(rank, world_size, args): logging.info("Using DDP") model = DDP(model, device_ids=[rank]) - optimizer = Cain(model.parameters(), lr=params.initial_lr) + optimizer = Cain(model.parameters(), lr=params.initial_lr, + max_eff_lr=2.0*params.initial_lr) scheduler = Eden(optimizer, params.lr_batches, params.lr_epochs)