fix the mismatch in batch_idx_train (#1757)

This commit is contained in:
zzasdf 2024-10-12 19:14:28 +08:00 committed by GitHub
parent fbba712887
commit 2653df5bda
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -424,8 +424,12 @@ def average_checkpoints_with_averaged_model(
state_dict_start = torch.load(filename_start, map_location=device)
state_dict_end = torch.load(filename_end, map_location=device)
average_period = state_dict_start["average_period"]
batch_idx_train_start = state_dict_start["batch_idx_train"]
batch_idx_train_start = (batch_idx_train_start // average_period) * average_period
batch_idx_train_end = state_dict_end["batch_idx_train"]
batch_idx_train_end = (batch_idx_train_end // average_period) * average_period
interval = batch_idx_train_end - batch_idx_train_start
assert interval > 0, interval
weight_end = batch_idx_train_end / interval