mirror of
https://github.com/osmarks/nanogpt-experiments.git
synced 2024-12-18 14:10:28 +00:00
commit
fb52554ca8
2
model.py
2
model.py
@@ -90,7 +90,7 @@ class Block(nn.Module):
|
|||||||
x = x + self.mlp(self.ln_2(x))
|
x = x + self.mlp(self.ln_2(x))
|
||||||
return x
|
return x
|
||||||
|
|
||||||
@dataclass
|
@dataclass(frozen=True)
|
||||||
class GPTConfig:
|
class GPTConfig:
|
||||||
block_size: int = 1024
|
block_size: int = 1024
|
||||||
vocab_size: int = 50257
|
vocab_size: int = 50257
|
||||||
|
Loading…
Reference in New Issue
Block a user