tangledgroup
/

tangled-llama-u-128k-base-v0.1

@@ -78,7 +78,7 @@ train:
   # Total number of tokens to train on (type: Optional[int], default: 3000000000000)
   # max_tokens: 3000000000000
   # max_tokens: 8159107755 # 796399 * 2049 * 5
-  max_tokens: 13054572408 # 796399 * 2049 * 8
   # Limits the number of optimizer steps to run. (type: Optional[int], default: null)
   max_steps:

   # Total number of tokens to train on (type: Optional[int], default: 3000000000000)
   # max_tokens: 3000000000000
   # max_tokens: 8159107755 # 796399 * 2049 * 5
+  max_tokens: 11422750857 # 796399 * 2049 * 7 (presumably samples * (block_size + 1) * epochs; TODO confirm)
   # Limits the number of optimizer steps to run. (type: Optional[int], default: null)
   max_steps: