Spaces:
Paused
Paused
Update app.py
Browse files
app.py
CHANGED
@@ -213,13 +213,19 @@ trainer = QuestionAnsweringTrainer(
|
|
213 |
|
214 |
#################################################
|
215 |
# special Trainer Baize Model
|
216 |
-
# Parameters
|
217 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
218 |
BATCH_SIZE = 64
|
219 |
-
size =
|
220 |
GRADIENT_ACCUMULATION_STEPS = BATCH_SIZE // MICRO_BATCH_SIZE
|
221 |
EPOCHS = 1
|
222 |
-
LEARNING_RATE = float(
|
223 |
CUTOFF_LEN = 512
|
224 |
LORA_R = 8
|
225 |
LORA_ALPHA = 16
|
|
|
213 |
|
214 |
#################################################
|
215 |
# special Trainer Baize Model
|
216 |
+
# Parameters for model 7b: size=7b, micro batch size=32, learning rate=0.0002
|
217 |
+
# Parameters for model 13b: size=13b, micro batch size=16, learning rate=0.0001
|
218 |
+
# Parameters for model 30b: size=30b, micro batch size=8, learning rate=0.00005
|
219 |
+
arg1 = '7b'
|
220 |
+
arg2 = 32
|
221 |
+
arg3 = 0.0002
|
222 |
+
|
223 |
+
MICRO_BATCH_SIZE = int(arg2)
|
224 |
BATCH_SIZE = 64
|
225 |
+
size = arg1
|
226 |
GRADIENT_ACCUMULATION_STEPS = BATCH_SIZE // MICRO_BATCH_SIZE
|
227 |
EPOCHS = 1
|
228 |
+
LEARNING_RATE = float(arg3)
|
229 |
CUTOFF_LEN = 512
|
230 |
LORA_R = 8
|
231 |
LORA_ALPHA = 16
|