diff --git a/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/.train_lora.py.swp b/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/.train_lora.py.swp index 04bdd989b..c2a1fa784 100644 Binary files a/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/.train_lora.py.swp and b/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/.train_lora.py.swp differ diff --git a/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/train_lora.py b/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/train_lora.py index 266556e3e..e69f30326 100755 --- a/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/train_lora.py +++ b/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/train_lora.py @@ -1592,6 +1592,7 @@ def run_adapter(rank, world_size, args, wb=None): model = DDP(model, device_ids=[rank], find_unused_parameters=True) print('-'*30) + lora_module = [] for i, module in enumerate(model.modules()): if isinstance(module, fairseq.modules.multihead_attention.MultiheadAttention): for m in module.modules():