File size: 410 Bytes
c764ac2 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 |
{
"model": "gpt2",
"dataset": "wikitext",
"subset": "wikitext-103-v1",
"output_dir": "output",
"num_epochs": 20,
"num_tokens": 100000000,
"window_size": 8,
"batch_size": 2048,
"learning_rate": 1e-05,
"warmup_steps": 3000,
"scheduler": "cosine",
"weight_decay": 0.1,
"random_seed": 42,
"eval_steps": 1000,
"patience": 5,
"id": "27a3016f17f9dd51"
} |