File size: 409 Bytes
73d6383
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
{
  "accumulate_grad_batches": 64,
  "auxk": 256,
  "auxk_coef": 0.03125,
  "batch_size": 1,
  "dead_steps_threshold": null,
  "dead_threshold": 0.001,
  "dead_tokens_threshold": 10000000,
  "expansion_factor": 64,
  "k": 64,
  "layers": null,
  "lr": 0.0001,
  "max_length": 2048,
  "model_name": "EleutherAI/pythia-160m-deduped",
  "skip_special_tokens": true,
  "standardize": true,
  "tuned_lens": false
}