From 9e86d1f44fdf388288d2186ac05758ab305eb2ed Mon Sep 17 00:00:00 2001
From: Daniel Povey
Date: Sun, 23 Oct 2022 00:14:38 +0800
Subject: [PATCH] reduce initial scale in GradScaler

---
 egs/librispeech/ASR/pruned_transducer_stateless7/train.py | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/egs/librispeech/ASR/pruned_transducer_stateless7/train.py b/egs/librispeech/ASR/pruned_transducer_stateless7/train.py
index 92d833459..763911765 100755
--- a/egs/librispeech/ASR/pruned_transducer_stateless7/train.py
+++ b/egs/librispeech/ASR/pruned_transducer_stateless7/train.py
@@ -1046,7 +1046,8 @@ def run(rank, world_size, args):
             params=params,
         )
 
-    scaler = GradScaler(enabled=params.use_fp16)
+    scaler = GradScaler(enabled=params.use_fp16,
+                        init_scale=1.0)
     if checkpoints and "grad_scaler" in checkpoints:
         logging.info("Loading grad scaler state dict")
         scaler.load_state_dict(checkpoints["grad_scaler"])