mirror of
https://github.com/karpathy/nanochat.git
synced 2025-12-06 04:12:13 +00:00
Merge a33d04dca1 into 4a87a0d19f
This commit is contained in:
commit
99278a6e41
|
|
@ -6,6 +6,9 @@ Example tasks: MMLU, ARC-Easy, ARC-Challenge, GSM8K, HumanEval, SmolTalk.
|
|||
"""
|
||||
|
||||
import random
|
||||
import logging
|
||||
|
||||
logger = logging.getLogger(__name__)
|
||||
|
||||
class Task:
|
||||
"""
|
||||
|
|
@ -34,7 +37,18 @@ class Task:
|
|||
|
||||
def __len__(self):
|
||||
start = self.start
|
||||
stop = self.num_examples() if self.stop is None else self.stop
|
||||
if self.stop is not None:
|
||||
num_ex = self.num_examples()
|
||||
if self.stop > num_ex:
|
||||
# Warn once, then cap stop
|
||||
logger.warning(
|
||||
f"Stop parameter ({self.stop}) exceeds dataset size ({num_ex}). "
|
||||
f"Using {num_ex} examples instead."
|
||||
)
|
||||
self.stop = num_ex
|
||||
stop = self.stop
|
||||
else:
|
||||
stop = self.num_examples()
|
||||
step = self.step
|
||||
span = stop - start
|
||||
num = (span + step - 1) // step # ceil_div(span, step)
|
||||
|
|
|
|||
Loading…
Reference in New Issue
Block a user