Merge origin/master into muonh

Resolved conflicts:
- nanochat/fp8.py: Kept _Float8MatmulND class from muonh
- scripts/base_train.py: Kept dual lrm logging from muonh
This commit is contained in:
Kaiyue Wen 2026-02-12 21:30:17 -08:00
commit 330fa1188c

View File

@@ -271,6 +271,7 @@ class _Float8MatmulND(torch.autograd.Function):
return grad_input, grad_weight
class Float8Linear(nn.Linear):
"""Drop-in nn.Linear replacement that does FP8 compute.