mirror of
https://github.com/karpathy/nanochat.git
synced 2026-03-07 09:50:28 +00:00
Merge origin/master into muonh
Resolved conflicts:
- nanochat/fp8.py: Kept _Float8MatmulND class from muonh
- scripts/base_train.py: Kept dual lrm logging from muonh
This commit is contained in:
commit
330fa1188c
|
|
@ -271,6 +271,7 @@ class _Float8MatmulND(torch.autograd.Function):
|
|||
return grad_input, grad_weight
|
||||
|
||||
|
||||
|
||||
class Float8Linear(nn.Linear):
|
||||
"""Drop-in nn.Linear replacement that does FP8 compute.
|
||||
|
||||
|
|
|
|||
Loading…
Reference in New Issue
Block a user