From 32ce342c8848eeaf09d298690923a078f40ac20e Mon Sep 17 00:00:00 2001 From: svlandeg Date: Tue, 30 Dec 2025 11:32:47 +0100 Subject: [PATCH] remove batch_num_tokens definition which was only used for experiment logging --- scripts/chat_sft.py | 1 - 1 file changed, 1 deletion(-) diff --git a/scripts/chat_sft.py b/scripts/chat_sft.py index 65b75f2..4afb96f 100644 --- a/scripts/chat_sft.py +++ b/scripts/chat_sft.py @@ -219,7 +219,6 @@ for step in range(num_iterations): dist.all_reduce(num_tokens, op=dist.ReduceOp.SUM) # sum over ranks for micro_step, (train_inputs, train_targets) in enumerate(steps): - batch_num_tokens = (train_targets >= 0).sum() with autocast_ctx: loss = model(train_inputs, train_targets, loss_reduction='sum') loss = loss / num_tokens # normalize loss here