From ea34b627438309ccbcc0389bb0bea25e3f3363ae Mon Sep 17 00:00:00 2001 From: Dane Claessen Date: Sun, 1 Feb 2026 03:58:58 -0600 Subject: [PATCH] fix sft checkpoint dir to match load_model (sft_checkpoints -> chatsft_checkpoints) --- scripts/chat_sft.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/scripts/chat_sft.py b/scripts/chat_sft.py index 91300b6..5175f01 100644 --- a/scripts/chat_sft.py +++ b/scripts/chat_sft.py @@ -285,7 +285,7 @@ while True: # save checkpoint at the end of the run (only on master process) if master_process and last_step and not args.dry_run: output_dirname = args.model_tag if args.model_tag else f"d{depth}" # e.g. d12 - checkpoint_dir = os.path.join(base_dir, "sft_checkpoints", output_dirname) + checkpoint_dir = os.path.join(base_dir, "chatsft_checkpoints", output_dirname) save_checkpoint( checkpoint_dir, step,