mirror of
https://github.com/karpathy/nanochat.git
synced 2026-03-04 16:30:28 +00:00
Merge pull request #1 from Dianababaei/feat/gpt-add-kvcache-import
Update GPT model configuration and initialization parameters in GPTConfig class
This commit is contained in:
commit
d44a3e090f
|
|
@@ -22,6 +22,7 @@ import torch.nn.functional as F
|
|||
from nanochat.common import get_dist_info, print0
|
||||
from nanochat.muon import Muon, DistMuon
|
||||
from nanochat.adamw import DistAdamW
|
||||
from nanochat.engine import KVCache
|
||||
|
||||
@dataclass
|
||||
class GPTConfig:
|
||||
|
|
|
|||
Loading…
Reference in New Issue
Block a user