From a8847a0f83d7a60be09d6762800feb204c3b4b64 Mon Sep 17 00:00:00 2001 From: KimYeongHyeon <32898945+KimYeongHyeon@users.noreply.github.com> Date: Tue, 2 Dec 2025 10:46:20 +0900 Subject: [PATCH] Fix script comment to reference correct file --- speedrun.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/speedrun.sh b/speedrun.sh index 7955ec5..501c176 100644 --- a/speedrun.sh +++ b/speedrun.sh @@ -96,7 +96,7 @@ torchrun --standalone --nproc_per_node=$NPROC_PER_NODE -m scripts.base_eval # Midtraining (teach the model conversation special tokens, tool use, multiple choice) # download 2.3MB of synthetic identity conversations to impart a personality to nanochat -# see dev/gen_sft_data.py for details on how this data was prepared and to get a sense of how you can easily tune it +# see dev/gen_synthetic_data.py for details on how this data was prepared and to get a sense of how you can easily tune it curl -L -o $NANOCHAT_BASE_DIR/identity_conversations.jsonl https://karpathy-public.s3.us-west-2.amazonaws.com/identity_conversations.jsonl # run midtraining and eval the model