File size: 496 Bytes
a60e942
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
453069f
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
from dataclasses import dataclass


@dataclass
class ModelConfig:
    """Bundle of default hyperparameters and file locations.

    Every field has a default, so ``ModelConfig()`` can be built with no
    arguments; any value may be overridden positionally (in declaration
    order) or by keyword.

    NOTE(review): the per-field remarks below are inferred from the field
    names only -- the code that consumes this config is not visible here,
    so confirm them against the model/training scripts.
    """

    # ---- architecture ----
    n_embeds: int = 384  # presumably the embedding width -- TODO confirm
    n_heads: int = 6  # presumably attention heads per layer -- TODO confirm
    n_layers: int = 6  # presumably the number of stacked layers -- TODO confirm
    dropout: float = 0.3

    # ---- training loop ----
    batch_size: int = 64
    block_size: int = 128  # presumably the context length -- TODO confirm
    max_iters: int = 20_000
    eval_interval: int = 250
    eval_iters: int = 200
    learning_rate: float = 0.0003
    weight_decay: float = 0.1

    # ---- filesystem locations (relative paths) ----
    checkpoint_path: str = "checkpoints/model.pth"
    data_path: str = "data/input.txt"