From cf450908c634fecf7a21334006504e471f416273 Mon Sep 17 00:00:00 2001 From: Daniel Povey Date: Sun, 9 Oct 2022 14:25:53 +0800 Subject: [PATCH] Revert also the changes in scaled_adam_exp85 regarding warmup schedule --- .../ASR/pruned_transducer_stateless7/conformer.py | 9 +++++---- 1 file changed, 5 insertions(+), 4 deletions(-) diff --git a/egs/librispeech/ASR/pruned_transducer_stateless7/conformer.py b/egs/librispeech/ASR/pruned_transducer_stateless7/conformer.py index eae352d9d..acb669497 100644 --- a/egs/librispeech/ASR/pruned_transducer_stateless7/conformer.py +++ b/egs/librispeech/ASR/pruned_transducer_stateless7/conformer.py @@ -96,13 +96,14 @@ class Conformer(EncoderInterface): ) # for the first third of the warmup period, we let the Conv2dSubsampling - # layer learn something + # layer learn something. then start warmup up the first and then the second + # encoder. self.encoder1 = ConformerEncoder( encoder_layer1, num_encoder_layers[0], dropout, - warmup_begin=0, - warmup_end=warmup_batches / 2, + warmup_begin=warmup_batches / 3, + warmup_end=warmup_batches * 2 / 3, ) encoder_layer2 = ConformerEncoderLayer( d_model[1], @@ -117,7 +118,7 @@ class Conformer(EncoderInterface): encoder_layer2, num_encoder_layers[1], dropout, - warmup_begin=warmup_batches / 2, + warmup_begin=warmup_batches * 2 / 3, warmup_end=warmup_batches, ), input_dim=d_model[0],