From 7f71572ab0d916dcd0989e9fad014391c04912e1 Mon Sep 17 00:00:00 2001 From: Sam Foreman Date: Fri, 13 Sep 2024 12:24:06 -0500 Subject: [PATCH] Update `megatron/training_log.py` --- megatron/training_log.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/megatron/training_log.py b/megatron/training_log.py index be2eacd059..cd6638e17d 100644 --- a/megatron/training_log.py +++ b/megatron/training_log.py @@ -397,7 +397,7 @@ def training_log( opt_stats, group=mpu.get_pipeline_model_parallel_group() ) # opt_stats_2 = opt_stats_2.clone().detach() - opt_stats_2 = accelerator.get_accelerator().FloatTensor(opt_stats_2) + opt_stats_2 = accelerator.FloatTensor(opt_stats_2) torch.distributed.all_reduce( opt_stats_2, op=torch.distributed.ReduceOp.MAX,