diff --git a/egs/librispeech/ASR/pruned_transducer_stateless7/conformer.py b/egs/librispeech/ASR/pruned_transducer_stateless7/conformer.py index cab0289c0..97fb79b25 100644 --- a/egs/librispeech/ASR/pruned_transducer_stateless7/conformer.py +++ b/egs/librispeech/ASR/pruned_transducer_stateless7/conformer.py @@ -450,8 +450,8 @@ class ConformerEncoder(nn.Module): initial_layerdrop_prob = 0.5 final_layerdrop_prob = 0.05 - if warmup_count < 100.0: - # As a special case, if warmup_count < 100.0 return 0 (drop no + if warmup_count < 5.0: + # As a special case, if warmup_count < 5.0 return 0 (drop no # layers). This is rather ugly, I'm afraid; it is intended to # enable our scan_pessimistic_batches_for_oom() code to work correctly # so if we are going to get OOM it will happen early.