alexkueck committed on
Commit
d329db5
·
1 Parent(s): 4f8b6a1

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +10 -4
app.py CHANGED
@@ -213,13 +213,19 @@ trainer = QuestionAnsweringTrainer(
213
 
214
  #################################################
215
  # special Trainer Baize Model
216
- # Parameters
217
- MICRO_BATCH_SIZE = int(sys.argv[2])
 
 
 
 
 
 
218
  BATCH_SIZE = 64
219
- size = sys.argv[1]
220
  GRADIENT_ACCUMULATION_STEPS = BATCH_SIZE // MICRO_BATCH_SIZE
221
  EPOCHS = 1
222
- LEARNING_RATE = float(sys.argv[3])
223
  CUTOFF_LEN = 512
224
  LORA_R = 8
225
  LORA_ALPHA = 16
 
213
 
214
  #################################################
215
  # special Trainer Baize Model
216
+ # Parameters (size, micro batch size, learning rate) for model 7b: 7b 32 0.0002
217
+ # Model 13b: 13b 16 0.0001
218
+ # Model 30b: 30b 8 0.00005
219
+ arg1 = '7b'
220
+ arg2 = 32
221
+ arg3 = 0.0002
222
+
223
+ MICRO_BATCH_SIZE = int(arg2)
224
  BATCH_SIZE = 64
225
+ size = arg1
226
  GRADIENT_ACCUMULATION_STEPS = BATCH_SIZE // MICRO_BATCH_SIZE
227
  EPOCHS = 1
228
+ LEARNING_RATE = float(arg3)
229
  CUTOFF_LEN = 512
230
  LORA_R = 8
231
  LORA_ALPHA = 16