Hari7696 committed on
Commit
04d6458
·
verified ·
1 Parent(s): dd6567d

Hari7696/peft-ia3

Browse files
README.md CHANGED
@@ -33,13 +33,14 @@ More information needed
33
  ### Training hyperparameters
34
 
35
  The following hyperparameters were used during training:
36
- - learning_rate: 0.001
37
  - train_batch_size: 8
38
  - eval_batch_size: 8
39
  - seed: 42
40
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
41
  - lr_scheduler_type: linear
42
- - num_epochs: 2
 
43
 
44
  ### Training results
45
 
@@ -50,5 +51,5 @@ The following hyperparameters were used during training:
50
  - PEFT 0.12.0
51
  - Transformers 4.42.4
52
  - Pytorch 2.3.1+cu121
53
- - Datasets 2.20.0
54
  - Tokenizers 0.19.1
 
33
  ### Training hyperparameters
34
 
35
  The following hyperparameters were used during training:
36
+ - learning_rate: 0.003
37
  - train_batch_size: 8
38
  - eval_batch_size: 8
39
  - seed: 42
40
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
41
  - lr_scheduler_type: linear
42
+ - lr_scheduler_warmup_steps: 50
43
+ - num_epochs: 4
44
 
45
  ### Training results
46
 
 
51
  - PEFT 0.12.0
52
  - Transformers 4.42.4
53
  - Pytorch 2.3.1+cu121
54
+ - Datasets 2.21.0
55
  - Tokenizers 0.19.1
adapter_config.json CHANGED
@@ -11,8 +11,10 @@
11
  "peft_type": "IA3",
12
  "revision": null,
13
  "target_modules": [
 
 
14
  "v",
15
- "q"
16
  ],
17
  "task_type": "SEQ_2_SEQ_LM"
18
  }
 
11
  "peft_type": "IA3",
12
  "revision": null,
13
  "target_modules": [
14
+ "k",
15
+ "q",
16
  "v",
17
+ "o"
18
  ],
19
  "task_type": "SEQ_2_SEQ_LM"
20
  }
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d1c9dc6003639d7d38984860d36c7a9c38dcac88cc070132a2442b742af65587
3
- size 230432
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f2a78c02265fbfaeac6c5725eeaade5ee667aa6e5aabab19ef05308ea7ac247
3
+ size 460888
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:420a0644455b70b18e0d63169d82689c4097655ffdc0c3701ba1815de8abfd8f
3
  size 5048
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c286501d83149fd15352a50b349d8b9d04bc2d4075f51ac7b8259928373311da
3
  size 5048