From d1fc8c5d0554e6056d70cca7a147b305237c9cf4 Mon Sep 17 00:00:00 2001
From: Sachin Agrawal <sachinagrawal@Mac.fritz.box>
Date: Mon, 3 Nov 2025 22:09:10 +0100
Subject: [PATCH] fixing deleted text issue

---
 speedrun.sh | 6 +++++-
 1 file changed, 5 insertions(+), 1 deletion(-)

diff --git a/speedrun.sh b/speedrun.sh
index c89331c7..7a98b40f 100644
--- a/speedrun.sh
+++ b/speedrun.sh
@@ -16,7 +16,7 @@ export NANOCHAT_BASE_DIR="$HOME/.cache/nanochat"
 mkdir -p $NANOCHAT_BASE_DIR
 
 # Number of processes per node for distributed training
-NPROC_PER_NODE=8
+NPROC_PER_NODE=4
 
 # -----------------------------------------------------------------------------
 # Python venv setup with uv
@@ -96,6 +96,10 @@ torchrun --standalone --nproc_per_node=$NPROC_PER_NODE -m scripts.base_eval
 # -----------------------------------------------------------------------------
 # Midtraining (teach the model conversation special tokens, tool use, multiple choice)
 
+# download 2.3MB of synthetic identity conversations to impart a personality to nanochat
+# see dev/gen_sft_data.py for details on how this data was prepared and to get a sense of how you can easily tune it
+curl -L -o $NANOCHAT_BASE_DIR/identity_conversations.jsonl https://karpathy-public.s3.us-west-2.amazonaws.com/identity_conversations.jsonl
+
 # run midtraining and eval the model
 torchrun --standalone --nproc_per_node=$NPROC_PER_NODE -m scripts.mid_train -- --run=$WANDB_RUN
 torchrun --standalone --nproc_per_node=$NPROC_PER_NODE -m scripts.chat_eval -- -i mid