fix: cast bf16 to fp32 on MPS (like CPU) to avoid dtype issues

This commit is contained in:
Dipesh Babu 2025-11-03 16:00:56 -05:00
parent a83646e098
commit 7a40ee77b4


@@ -65,7 +65,7 @@ def build_model(checkpoint_dir, step, device, phase):
     """
     assert phase in ["train", "eval"], f"Invalid phase: {phase}"
     model_data, optimizer_data, meta_data = load_checkpoint(checkpoint_dir, step, device, load_optimizer=False)
-    if device.type == "cpu":
+    if device.type in {"cpu", "mps"}:
         # Convert bfloat16 tensors to float for CPU inference
         model_data = {
             k: v.float() if v.dtype == torch.bfloat16 else v
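
For context, a minimal standalone sketch of the same upcast, assuming a hypothetical cast_bf16_state_dict helper and a plain state-dict checkpoint (names not from the repository): MPS, like CPU, lacks full bfloat16 kernel coverage, so bf16 tensors are upcast to fp32 before inference on those backends.

# Minimal sketch (hypothetical helper, not the repository's code): upcast any
# bfloat16 tensors in a loaded state dict to float32 when targeting CPU or MPS.
import torch

def cast_bf16_state_dict(state_dict: dict, device: torch.device) -> dict:
    if device.type in {"cpu", "mps"}:
        return {
            k: v.float() if isinstance(v, torch.Tensor) and v.dtype == torch.bfloat16 else v
            for k, v in state_dict.items()
        }
    return state_dict

# Usage (hypothetical checkpoint path):
# model_data = torch.load("checkpoint.pt", map_location="cpu")
# model_data = cast_bf16_state_dict(model_data, torch.device("mps"))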