Make it start warming up from the very start, and increase warmup_batches to 6k

This commit is contained in:
Daniel Povey 2022-10-08 19:09:41 +08:00
parent 5c99e97c3b
commit 2631f05c1f

View File

@@ -101,8 +101,8 @@ class Conformer(EncoderInterface):
encoder_layer1, encoder_layer1,
num_encoder_layers[0], num_encoder_layers[0],
dropout, dropout,
warmup_begin=warmup_batches / 3, warmup_begin=0,
warmup_end=2 * warmup_batches / 3, warmup_end=warmup_batches / 2,
) )
encoder_layer2 = ConformerEncoderLayer( encoder_layer2 = ConformerEncoderLayer(
d_model[1], d_model[1],
@@ -117,7 +117,7 @@ class Conformer(EncoderInterface):
encoder_layer2, encoder_layer2,
num_encoder_layers[1], num_encoder_layers[1],
dropout, dropout,
warmup_begin=2 * warmup_batches / 3, warmup_begin=warmup_batches / 2,
warmup_end=warmup_batches, warmup_end=warmup_batches,
), ),
input_dim=d_model[0], input_dim=d_model[0],