mirror of
https://github.com/k2-fsa/icefall.git
synced 2025-12-11 06:55:27 +00:00
Add warmup schedule where dropout disappears from earlier layers first.
This commit is contained in:
parent
9c1a239931
commit
300da1306d
@@ -49,8 +49,7 @@ class Conformer(EncoderInterface):
|
||||
layer_dropout (float): layer-dropout rate.
|
||||
cnn_module_kernel (int): Kernel size of convolution module
|
||||
vgg_frontend (bool): whether to use vgg frontend.
|
||||
- warmup_batches (float): number of batches to warm up over (gradually skip
|
||||
- layer bypass)
|
||||
+ warmup_batches (float): number of batches to warm up over
|
||||
"""
|
||||
|
||||
def __init__(
|
||||
@@ -65,7 +64,7 @@ class Conformer(EncoderInterface):
|
||||
num_encoder_layers: Tuple[int] = (12, 12),
|
||||
dropout: float = 0.1,
|
||||
cnn_module_kernel: Tuple[int] = (31, 31),
|
||||
- warmup_batches: float = 3000,
|
||||
+ warmup_batches: float = 6000.0,
|
||||
) -> None:
|
||||
super(Conformer, self).__init__()
|
||||
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user