larry1129 committed on
Commit
3305a62
1 Parent(s): b9d0bf3

Training complete, uploading model.

Browse files
Files changed (3) hide show
  1. README.md +1 -1
  2. adapter_config.json +5 -5
  3. training_args.bin +1 -1
README.md CHANGED
@@ -36,7 +36,7 @@ More information needed
36
  ### Training hyperparameters
37
 
38
  The following hyperparameters were used during training:
39
- - learning_rate: 0.0003
40
  - train_batch_size: 2
41
  - eval_batch_size: 8
42
  - seed: 3407
 
36
  ### Training hyperparameters
37
 
38
  The following hyperparameters were used during training:
39
+ - learning_rate: 5e-05
40
  - train_batch_size: 2
41
  - eval_batch_size: 8
42
  - seed: 3407
adapter_config.json CHANGED
@@ -20,13 +20,13 @@
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
- "v_proj",
24
- "o_proj",
25
  "down_proj",
26
- "q_proj",
27
  "k_proj",
28
- "gate_proj",
29
- "up_proj"
 
30
  ],
31
  "task_type": "CAUSAL_LM",
32
  "use_dora": false,
 
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
+ "gate_proj",
24
+ "up_proj",
25
  "down_proj",
 
26
  "k_proj",
27
+ "v_proj",
28
+ "q_proj",
29
+ "o_proj"
30
  ],
31
  "task_type": "CAUSAL_LM",
32
  "use_dora": false,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:24bc15ac067833831a0cf28ec96a7df5b55efa782ced4d8ef90ec53b2e30d4df
3
  size 5496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a3063e88840b41fd2c7a71f1114c0e322c097a7e6e6f8221418ab8138e241610
3
  size 5496