mirror of
https://github.com/karpathy/nanochat.git
synced 2026-06-15 02:29:09 +00:00
Use orig_model (the original uncompiled model) for sampling.
This commit is contained in:
parent
3d55b1df96
commit
3dbf6adf4f
|
|
@ -408,7 +408,7 @@ while True:
|
|||
# use the original uncompiled model because the inputs keep changing shape
|
||||
if args.sample_every > 0 and master_process and (last_step or (step > 0 and step % args.sample_every == 0)):
|
||||
model.eval()
|
||||
evaluate_sample(model, tokenizer, lambda x:print0(x), True)
|
||||
evaluate_sample(orig_model, tokenizer, lambda x:print0(x), True)
|
||||
model.train()
|
||||
|
||||
# save checkpoint: at the end of the run, or every save_every steps, except at the first step or the resume step
|
||||
|
|
|
|||
Loading…
Reference in New Issue
Block a user