Make biases learn at twice the speed

This commit is contained in:
Daniel Povey 2022-05-21 17:30:45 +08:00
parent b7adb6d738
commit 992f922f81

View File

@@ -872,8 +872,8 @@ def run(rank, world_size, args):
 model = DDP(model, device_ids=[rank])
-params_to_pass = [ {'params': [ p for (name,p) in model.named_parameters() if name != 'simple_am_proj.weight' ] },
-{'params': [ p for (name,p) in model.named_parameters() if name == 'simple_am_proj.weight' ], 'lr': params.initial_lr*0.25 } ]
+params_to_pass = [ {'params': [ p for (name,p) in model.named_parameters() if 'bias' not in name] },
+{'params': [ p for (name,p) in model.named_parameters() if 'bias' in name ], 'lr': params.initial_lr*2.0 } ]
 optimizer = Cain(params_to_pass, lr=params.initial_lr)