tykiww commited on
Commit
c5ce72e
·
verified ·
1 Parent(s): 7ebc9c5

Update config/config.json

Browse files
Files changed (1) hide show
  1. config/config.json +9 -7
config/config.json CHANGED
@@ -3,20 +3,22 @@
3
  "general": {
4
  "max_seq_length": 128,
5
  "seed": 42,
 
 
 
 
 
 
6
  },
7
  "peft": {
8
- "r": 64,
9
  "alpha": 16,
10
  "dropout": 0,
11
  "bias": "none",
12
  "rslora": false,
13
- "loftq_config": null
14
  },
15
  "sft": {
16
- "output_dir": "outputs",
17
- "num_train_epochs": null,
18
- "dataset_text_field" = "text",
19
- "max_steps": 60,
20
  "per_device_train_batch_size": 2,
21
  "gradient_accumulation_steps": 4,
22
  "learning_rate": 2e-4,
@@ -26,7 +28,7 @@
26
  "weight_decay": 0.01,
27
  "lr_scheduler_type": "linear",
28
  "dataset_num_proc": 2,
29
- "packing": false
30
  },
31
  "choices": ["gpt2", "bert-base-uncased", "llama3-8b"]
32
  }
 
3
  "general": {
4
  "max_seq_length": 128,
5
  "seed": 42,
6
+ "num_train_epochs": null,
7
+ "max_steps": 60,
8
+ "dataset_text_field": "text",
9
+ "model_name": null,
10
+ "repository": null
11
+
12
  },
13
  "peft": {
14
+ "r": 64,
15
  "alpha": 16,
16
  "dropout": 0,
17
  "bias": "none",
18
  "rslora": false,
19
+ "loftq_config": null
20
  },
21
  "sft": {
 
 
 
 
22
  "per_device_train_batch_size": 2,
23
  "gradient_accumulation_steps": 4,
24
  "learning_rate": 2e-4,
 
28
  "weight_decay": 0.01,
29
  "lr_scheduler_type": "linear",
30
  "dataset_num_proc": 2,
31
+ "packing": false
32
  },
33
  "choices": ["gpt2", "bert-base-uncased", "llama3-8b"]
34
  }