Fix the mismatch in batch_idx_train

This commit is contained in:
zzasdf 2024-09-26 15:31:15 +08:00
parent 5c04c31292
commit 01c9d06e3f

View File

@@ -424,8 +424,12 @@ def average_checkpoints_with_averaged_model(
state_dict_start = torch.load(filename_start, map_location=device)
state_dict_end = torch.load(filename_end, map_location=device)
average_period = state_dict_start["average_period"]
batch_idx_train_start = state_dict_start["batch_idx_train"]
batch_idx_train_start = (batch_idx_train_start // average_period) * average_period
batch_idx_train_end = state_dict_end["batch_idx_train"]
batch_idx_train_end = (batch_idx_train_end // average_period) * average_period
interval = batch_idx_train_end - batch_idx_train_start
assert interval > 0, interval
weight_end = batch_idx_train_end / interval