mirror of
https://github.com/karpathy/nanochat.git
synced 2025-12-06 04:12:13 +00:00
revert change of base to sft for quick inline test
This commit is contained in:
parent
b399e43168
commit
c6f5bd67db
|
|
@@ -332,7 +332,7 @@ if __name__ == "__main__":
|
||||||
autocast_ctx = torch.amp.autocast(device_type=device_type, dtype=torch.bfloat16) if device_type == "cuda" else nullcontext()
|
autocast_ctx = torch.amp.autocast(device_type=device_type, dtype=torch.bfloat16) if device_type == "cuda" else nullcontext()
|
||||||
|
|
||||||
# load the model and tokenizer
|
# load the model and tokenizer
|
||||||
model, tokenizer, meta = load_model("sft", device, phase="eval")
|
model, tokenizer, meta = load_model("base", device, phase="eval")
|
||||||
bos_token_id = tokenizer.get_bos_token_id()
|
bos_token_id = tokenizer.get_bos_token_id()
|
||||||
# common hyperparameters
|
# common hyperparameters
|
||||||
kwargs = dict(max_tokens=64, temperature=0.0)
|
kwargs = dict(max_tokens=64, temperature=0.0)
|
||||||
|
|
|
||||||
Loading…
Reference in New Issue
Block a user