mtasic85 committed on
Commit
11b5422
1 Parent(s): 4f006dd

pretrain model, reduce from 8 to 7 epochs

Browse files
Files changed (1) hide show
  1. scripts/pretrain-model.yaml +1 -1
scripts/pretrain-model.yaml CHANGED
@@ -78,7 +78,7 @@ train:
78
  # Total number of tokens to train on (type: Optional[int], default: 3000000000000)
79
  # max_tokens: 3000000000000
80
  # max_tokens: 8159107755 # 796399 * 2049 * 5
81
- max_tokens: 13054572408 # 796399 * 2049 * 8
82
 
83
  # Limits the number of optimizer steps to run. (type: Optional[int], default: null)
84
  max_steps:
 
78
  # Total number of tokens to train on (type: Optional[int], default: 3000000000000)
79
  # max_tokens: 3000000000000
80
  # max_tokens: 8159107755 # 796399 * 2049 * 5
81
+ max_tokens: 11422750857 # 796399 * 2049 * 7
82
 
83
  # Limits the number of optimizer steps to run. (type: Optional[int], default: null)
84
  max_steps: