Merge pull request #35 from bhaskar0210s/master

fix: return inf instead of crashing when evaluate_bpb has zero total_bytes
This commit is contained in:
Andrej 2025-10-29 08:06:24 -07:00 committed by GitHub
commit 29ff38d94b
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -59,5 +59,7 @@ def evaluate_bpb(model, batches, steps, token_bytes):
     # move both to cpu, calculate bpb and return
     total_nats = total_nats.item()
     total_bytes = total_bytes.item()
+    if total_bytes == 0:
+        return float('inf')
     bpb = total_nats / (math.log(2) * total_bytes)
     return bpb