BroBro87 committed on
Commit
988e0c2
1 Parent(s): d1e3ad5

End of training

Browse files
README.md CHANGED
@@ -18,7 +18,7 @@ should probably proofread and complete it, then remove this comment. -->
18
 
19
  This model is a fine-tuned version of [stabilityai/stablelm-zephyr-3b](https://huggingface.co/stabilityai/stablelm-zephyr-3b) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
- - Loss: 6.4023
22
 
23
  ## Model description
24
 
@@ -50,12 +50,31 @@ The following hyperparameters were used during training:
50
 
51
  ### Training results
52
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
53
 
54
 
55
  ### Framework versions
56
 
57
  - PEFT 0.9.0
58
  - Transformers 4.38.2
59
- - Pytorch 2.1.2+cu121
60
  - Datasets 2.18.0
61
  - Tokenizers 0.15.2
 
18
 
19
  This model is a fine-tuned version of [stabilityai/stablelm-zephyr-3b](https://huggingface.co/stabilityai/stablelm-zephyr-3b) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
+ - Loss: 3.4473
22
 
23
  ## Model description
24
 
 
50
 
51
  ### Training results
52
 
53
+ | Training Loss | Epoch | Step | Validation Loss |
54
+ |:-------------:|:-----:|:----:|:---------------:|
55
+ | No log | 0.56 | 1 | 2.9512 |
56
+ | No log | 1.67 | 3 | 2.9727 |
57
+ | No log | 2.78 | 5 | 3.2578 |
58
+ | No log | 3.89 | 7 | 2.9238 |
59
+ | No log | 5.0 | 9 | 3.3867 |
60
+ | 0.916 | 5.56 | 10 | 3.3066 |
61
+ | 0.916 | 6.67 | 12 | 3.2090 |
62
+ | 0.916 | 7.78 | 14 | 3.4980 |
63
+ | 0.916 | 8.89 | 16 | 3.5098 |
64
+ | 0.916 | 10.0 | 18 | 3.4434 |
65
+ | 0.916 | 10.56 | 19 | 3.4375 |
66
+ | 0.1354 | 11.67 | 21 | 3.4238 |
67
+ | 0.1354 | 12.78 | 23 | 3.4336 |
68
+ | 0.1354 | 13.89 | 25 | 3.4473 |
69
+ | 0.1354 | 15.0 | 27 | 3.4492 |
70
+ | 0.1354 | 15.56 | 28 | 3.4492 |
71
+ | 0.0754 | 16.67 | 30 | 3.4473 |
72
 
73
 
74
  ### Framework versions
75
 
76
  - PEFT 0.9.0
77
  - Transformers 4.38.2
78
+ - Pytorch 2.1.0+cu121
79
  - Datasets 2.18.0
80
  - Tokenizers 0.15.2
adapter_config.json CHANGED
@@ -19,13 +19,13 @@
19
  "rank_pattern": {},
20
  "revision": null,
21
  "target_modules": [
22
- "down_proj",
23
  "k_proj",
24
- "o_proj",
25
- "q_proj",
26
  "up_proj",
27
  "gate_proj",
28
- "v_proj"
 
 
 
29
  ],
30
  "task_type": "CAUSAL_LM",
31
  "use_dora": false,
 
19
  "rank_pattern": {},
20
  "revision": null,
21
  "target_modules": [
 
22
  "k_proj",
 
 
23
  "up_proj",
24
  "gate_proj",
25
+ "v_proj",
26
+ "down_proj",
27
+ "o_proj",
28
+ "q_proj"
29
  ],
30
  "task_type": "CAUSAL_LM",
31
  "use_dora": false,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e44ce263e6fd885f50d82ca515b9325375b43ee36ededb75acf161ce88bc2e41
3
- size 48
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff067eb0d24d6ac677cadfb8c1d21e9e59f8757a225366830ffdefb6711bca47
3
+ size 801172960
runs/Mar13_10-17-13_6e2c9b113eb3/events.out.tfevents.1710325034.6e2c9b113eb3.153.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e2a2107835eead15477ebad78e5ebe4ce72f8d9112d4f3d1d935df4d76024d80
3
+ size 5104
runs/Mar13_10-17-41_6e2c9b113eb3/events.out.tfevents.1710325062.6e2c9b113eb3.153.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:83bfcbc5f4ed8aec3c46ed95e400ea108c0df213f7233f7833a54fe7316cc9c8
3
+ size 13935
runs/Mar13_10-17-41_6e2c9b113eb3/events.out.tfevents.1710325549.6e2c9b113eb3.153.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20ef89c3a4db7f2a03ca1717df043d5c8aa5f16c24f4727e7b1c8877728826e0
3
+ size 354
runs/Mar13_10-26-32_6e2c9b113eb3/events.out.tfevents.1710325593.6e2c9b113eb3.153.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f5957b224a966b23f239b9269b97cbeaea98cfe2aaf4ee6677bf7008910dfec0
3
+ size 10595
runs/Mar13_10-26-32_6e2c9b113eb3/events.out.tfevents.1710325885.6e2c9b113eb3.153.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b952392a880e41e94dde187919c6ef0690a75f9e9fa48c489595215596a376a9
3
+ size 354
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3aa663e6169809153a242be034068df0397a9a316586710ff0a0bab8c5f39dda
3
  size 4920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e1b006c398a102784e93bbad6860bfc91328a0b6e4dfe64dead070a31c3d334
3
  size 4920