reduce initial scale in GradScaler

This commit is contained in:
Daniel Povey 2022-10-23 00:14:38 +08:00
parent b7083e7aff
commit 9e86d1f44f

View File

@@ -1046,7 +1046,8 @@ def run(rank, world_size, args):
 params=params,
 )
-scaler = GradScaler(enabled=params.use_fp16)
+scaler = GradScaler(enabled=params.use_fp16,
+                    init_scale=1.0)
 if checkpoints and "grad_scaler" in checkpoints:
     logging.info("Loading grad scaler state dict")
     scaler.load_state_dict(checkpoints["grad_scaler"])