fix bug in chat_sft: the attention window pattern must be preserved (sigh)

This commit is contained in:
Andrej Karpathy 2026-02-01 20:58:44 +00:00
parent eaf49a33c8
commit 8b4849d548

View File

@@ -301,6 +301,7 @@ while True:
"n_head": model.config.n_head,
"n_kv_head": model.config.n_kv_head,
"n_embd": model.config.n_embd,
"window_pattern": model.config.window_pattern,
},
"user_config": user_config, # inputs to the training script
}