From 992f922f81a8faa949c6e4420b03ebba023d45e5 Mon Sep 17 00:00:00 2001
From: Daniel Povey
Date: Sat, 21 May 2022 17:30:45 +0800
Subject: [PATCH] Make biases learn at twice the speed

---
 egs/librispeech/ASR/pruned_transducer_stateless4/train.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/egs/librispeech/ASR/pruned_transducer_stateless4/train.py b/egs/librispeech/ASR/pruned_transducer_stateless4/train.py
index af4bb577e..daccbee04 100755
--- a/egs/librispeech/ASR/pruned_transducer_stateless4/train.py
+++ b/egs/librispeech/ASR/pruned_transducer_stateless4/train.py
@@ -872,8 +872,8 @@ def run(rank, world_size, args):
         model = DDP(model, device_ids=[rank])
-    params_to_pass = [ {'params': [ p for (name,p) in model.named_parameters() if name != 'simple_am_proj.weight' ] },
-                       {'params': [ p for (name,p) in model.named_parameters() if name == 'simple_am_proj.weight' ], 'lr': params.initial_lr*0.25 } ]
+    params_to_pass = [ {'params': [ p for (name,p) in model.named_parameters() if 'bias' not in name] },
+                       {'params': [ p for (name,p) in model.named_parameters() if 'bias' in name ], 'lr': params.initial_lr*2.0 } ]
     optimizer = Cain(params_to_pass, lr=params.initial_lr)