mirror of
https://github.com/karpathy/nanochat.git
synced 2026-06-15 10:39:08 +00:00
claude suggested fix.
This commit is contained in:
parent
0725192e07
commit
0b6d93f3c2
|
|
@@ -158,7 +158,7 @@ def flash_attn_with_kvcache(q, k_cache, v_cache, k=None, v=None, cache_seqlens=N
|
|||
q, k_cache, v_cache, k=k, v=v, cache_seqlens=cache_seqlens,
|
||||
causal=causal, window_size=window_size
|
||||
)
|
||||
- y = XSA(y, v_cache)
|
||||
+ y = XSA(y, v)
|
||||
return y
|
||||
|
||||
# SDPA fallback: manually manage KV cache
|
||||
|
|
|
|||
Loading…
Reference in New Issue
Block a user