Fix SFT checkpoint directory to match load_model (sft_checkpoints -> chatsft_checkpoints)

This commit is contained in:
Dane Claessen 2026-02-01 03:58:58 -06:00
parent 31b61d2d17
commit ea34b62743
No known key found for this signature in database

View File

@@ -285,7 +285,7 @@ while True:
# save checkpoint at the end of the run (only on master process)
if master_process and last_step and not args.dry_run:
output_dirname = args.model_tag if args.model_tag else f"d{depth}" # e.g. d12
-checkpoint_dir = os.path.join(base_dir, "sft_checkpoints", output_dirname)
+checkpoint_dir = os.path.join(base_dir, "chatsft_checkpoints", output_dirname)
save_checkpoint(
checkpoint_dir,
step,