mirror of
https://github.com/karpathy/nanochat.git
synced 2025-12-06 04:12:13 +00:00
Update run1000.sh to add missing --run=$WANDB_RUN
This commit is contained in:
parent
cf587acb1a
commit
ba4f40bf58
|
|
@ -70,7 +70,7 @@ python -m scripts.tok_eval
|
||||||
# which would decrease model performance. Possibly 2, 3 or so epochs is ~ok, but certainly not ideal and at 10+ epochs we'd
|
# which would decrease model performance. Possibly 2, 3 or so epochs is ~ok, but certainly not ideal and at 10+ epochs we'd
|
||||||
# start to overfit hard.
|
# start to overfit hard.
|
||||||
# 5) That's it, everything else (e.g. the learning rates) is adjusted automatically by the training script.
|
# 5) That's it, everything else (e.g. the learning rates) is adjusted automatically by the training script.
|
||||||
torchrun --standalone --nproc_per_node=8 -m scripts.base_train -- --depth=32 --device_batch_size=8
|
torchrun --standalone --nproc_per_node=8 -m scripts.base_train -- --depth=32 --device_batch_size=8 --run=$WANDB_RUN
|
||||||
torchrun --standalone --nproc_per_node=8 -m scripts.base_loss
|
torchrun --standalone --nproc_per_node=8 -m scripts.base_loss
|
||||||
torchrun --standalone --nproc_per_node=8 -m scripts.base_eval
|
torchrun --standalone --nproc_per_node=8 -m scripts.base_eval
|
||||||
|
|
||||||
|
|
|
||||||
Loading…
Reference in New Issue
Block a user