mirror of
https://github.com/karpathy/nanochat.git
synced 2026-02-03 00:59:55 +00:00
fix bug in chat_sft, the attention window must be preserved sigh
This commit is contained in:
parent
eaf49a33c8
commit
8b4849d548
|
|
@ -301,6 +301,7 @@ while True:
|
|||
"n_head": model.config.n_head,
|
||||
"n_kv_head": model.config.n_kv_head,
|
||||
"n_embd": model.config.n_embd,
|
||||
"window_pattern": model.config.window_pattern,
|
||||
},
|
||||
"user_config": user_config, # inputs to the training script
|
||||
}
|
||||
|
|
|
|||
Loading…
Reference in New Issue
Block a user