File size: 375 Bytes
5a36696
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
097622b
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
{    
    "model":  {
        "vocab_size": 8192,
        "context_length": 128,
        "d_embedding": 512,
        "d_intermediate": 2048,
        "n_heads": 16,
        "n_layers": 16,
        "qkv_bias": false
    },
    "train": {
        "peak_lr": 0.001,
        "warmup_ratio": 0.01,
        "n_epochs": 2,
        "batch_size": 8,
        "weight_decay": 0.1
    }
}