diff --git a/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/.bitfit.py.swp b/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/.bitfit.py.swp index dbee27a9d..541ad6e4d 100644 Binary files a/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/.bitfit.py.swp and b/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/.bitfit.py.swp differ diff --git a/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/bitfit.py b/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/bitfit.py index b9ec2eb62..8809e7f02 100755 --- a/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/bitfit.py +++ b/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/bitfit.py @@ -1587,6 +1587,12 @@ def run_adapter(rank, world_size, args, wb=None): adapter_names = [] adapter_param = [] for n, p in model.named_parameters(): + if 'bias' in n: + adapter_names.append(n) + adapter_param.append(p) + else: + p.requires_grad = False + ''' if 'adapters' in n:# or 'joiner' in n or 'simple' in n or 'ctc' in n: adapter_names.append(n) adapter_param.append(p) @@ -1594,6 +1600,7 @@ def run_adapter(rank, world_size, args, wb=None): p.requires_grad = True else: p.requires_grad = False + ''' for n, p in model.named_parameters(): p.requires_grad = False