mirror of
https://github.com/karpathy/nanochat.git
synced 2025-12-06 04:12:13 +00:00
Merge pull request #9 from LokiMetaSmith/fix-dataloader-typeerror
Fix TypeError in tokenizing_distributed_data_loader and robustness in…
This commit is contained in:
commit
104308cf78
|
|
@@ -26,7 +26,9 @@ def print0(s="",**kwargs):
|
||||||
for arg in sys.argv[1:]:
|
for arg in sys.argv[1:]:
|
||||||
if '=' not in arg:
|
if '=' not in arg:
|
||||||
# assume it's the name of a config file
|
# assume it's the name of a config file
|
||||||
assert not arg.startswith('--')
|
if arg.startswith('--'):
|
||||||
|
# ignore flags like --help or others without =
|
||||||
|
continue
|
||||||
config_file = arg
|
config_file = arg
|
||||||
print0(f"Overriding config with {config_file}:")
|
print0(f"Overriding config with {config_file}:")
|
||||||
with open(config_file) as f:
|
with open(config_file) as f:
|
||||||
|
|
|
||||||
|
|
@@ -81,7 +81,8 @@ def tokenizing_distributed_data_loader_with_state(B, T, split, tokenizer_threads
|
||||||
state_dict = {"pq_idx": pq_idx, "rg_idx": rg_idx} # we need this in case we wish to approximately resume training
|
state_dict = {"pq_idx": pq_idx, "rg_idx": rg_idx} # we need this in case we wish to approximately resume training
|
||||||
yield inputs, targets, state_dict
|
yield inputs, targets, state_dict
|
||||||
|
|
||||||
def tokenizing_distributed_data_loader(*args, **kwargs):
|
def tokenizing_distributed_data_loader(*args, device="cuda", **kwargs):
|
||||||
# helper function that only emits the inputs/targets and not the state_dict
|
# helper function that only emits the inputs/targets and not the state_dict
|
||||||
|
kwargs["device"] = device
|
||||||
for inputs, targets, state_dict in tokenizing_distributed_data_loader_with_state(*args, **kwargs):
|
for inputs, targets, state_dict in tokenizing_distributed_data_loader_with_state(*args, **kwargs):
|
||||||
yield inputs, targets
|
yield inputs, targets
|
||||||
|
|
|
||||||
Loading…
Reference in New Issue
Block a user