File size: 410 Bytes
c764ac2
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
{
    "model": "gpt2",
    "dataset": "wikitext",
    "subset": "wikitext-103-v1",
    "output_dir": "output",
    "num_epochs": 20,
    "num_tokens": 100000000,
    "window_size": 8,
    "batch_size": 2048,
    "learning_rate": 1e-05,
    "warmup_steps": 3000,
    "scheduler": "cosine",
    "weight_decay": 0.1,
    "random_seed": 42,
    "eval_steps": 1000,
    "patience": 5,
    "id": "27a3016f17f9dd51"
}