allknowingroger
committed on
Commit
•
1a20ffc
1
Parent(s):
9949150
Upload folder using huggingface_hub
Browse files — This view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +1 -0
- README.md +38 -0
- added_tokens.json +5 -0
- config.json +28 -0
- mergekit_config.yml +8 -0
- merges.txt +0 -0
- model-00001-of-00063.safetensors +3 -0
- model-00002-of-00063.safetensors +3 -0
- model-00003-of-00063.safetensors +3 -0
- model-00004-of-00063.safetensors +3 -0
- model-00005-of-00063.safetensors +3 -0
- model-00006-of-00063.safetensors +3 -0
- model-00007-of-00063.safetensors +3 -0
- model-00008-of-00063.safetensors +3 -0
- model-00009-of-00063.safetensors +3 -0
- model-00010-of-00063.safetensors +3 -0
- model-00011-of-00063.safetensors +3 -0
- model-00012-of-00063.safetensors +3 -0
- model-00013-of-00063.safetensors +3 -0
- model-00014-of-00063.safetensors +3 -0
- model-00015-of-00063.safetensors +3 -0
- model-00016-of-00063.safetensors +3 -0
- model-00017-of-00063.safetensors +3 -0
- model-00018-of-00063.safetensors +3 -0
- model-00019-of-00063.safetensors +3 -0
- model-00020-of-00063.safetensors +3 -0
- model-00021-of-00063.safetensors +3 -0
- model-00022-of-00063.safetensors +3 -0
- model-00023-of-00063.safetensors +3 -0
- model-00024-of-00063.safetensors +3 -0
- model-00025-of-00063.safetensors +3 -0
- model-00026-of-00063.safetensors +3 -0
- model-00027-of-00063.safetensors +3 -0
- model-00028-of-00063.safetensors +3 -0
- model-00029-of-00063.safetensors +3 -0
- model-00030-of-00063.safetensors +3 -0
- model-00031-of-00063.safetensors +3 -0
- model-00032-of-00063.safetensors +3 -0
- model-00033-of-00063.safetensors +3 -0
- model-00034-of-00063.safetensors +3 -0
- model-00035-of-00063.safetensors +3 -0
- model-00036-of-00063.safetensors +3 -0
- model-00037-of-00063.safetensors +3 -0
- model-00038-of-00063.safetensors +3 -0
- model-00039-of-00063.safetensors +3 -0
- model-00040-of-00063.safetensors +3 -0
- model-00041-of-00063.safetensors +3 -0
- model-00042-of-00063.safetensors +3 -0
- model-00043-of-00063.safetensors +3 -0
- model-00044-of-00063.safetensors +3 -0
.gitattributes
CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
+
tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
README.md
ADDED
@@ -0,0 +1,38 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
base_model:
|
3 |
+
- smelborp/StellarDong-72b
|
4 |
+
library_name: transformers
|
5 |
+
tags:
|
6 |
+
- mergekit
|
7 |
+
- merge
|
8 |
+
|
9 |
+
---
|
10 |
+
# merge
|
11 |
+
|
12 |
+
This is a merge of pre-trained language models created using [mergekit](https://github.com/cg123/mergekit).
|
13 |
+
|
14 |
+
## Merge Details
|
15 |
+
### Merge Method
|
16 |
+
|
17 |
+
This model was merged using the SLERP merge method.
|
18 |
+
|
19 |
+
### Models Merged
|
20 |
+
|
21 |
+
The following models were included in the merge:
|
22 |
+
* [smelborp/StellarDong-72b](https://huggingface.co/smelborp/StellarDong-72b)
|
23 |
+
|
24 |
+
### Configuration
|
25 |
+
|
26 |
+
The following YAML configuration was used to produce this model:
|
27 |
+
|
28 |
+
```yaml
|
29 |
+
models:
|
30 |
+
- model: smelborp/StellarDong-72b
|
31 |
+
- model: smelborp/StellarDong-72b
|
32 |
+
merge_method: slerp
|
33 |
+
base_model: smelborp/StellarDong-72b
|
34 |
+
dtype: float32
|
35 |
+
parameters:
|
36 |
+
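t: [0, 0.5, 1, 0.5, 0] # t goes 0 -> 1 -> 0 across layers: base_model weights at the input & output layers, the other listed model in the middle layers (both entries here are smelborp/StellarDong-72b)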
|
37 |
+
|
38 |
+
```
|
added_tokens.json
ADDED
@@ -0,0 +1,5 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"<|endoftext|>": 151643,
|
3 |
+
"<|im_end|>": 151645,
|
4 |
+
"<|im_start|>": 151644
|
5 |
+
}
|
config.json
ADDED
@@ -0,0 +1,28 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "smelborp/StellarDong-72b",
|
3 |
+
"architectures": [
|
4 |
+
"Qwen2ForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_dropout": 0.0,
|
7 |
+
"eos_token_id": 151645,
|
8 |
+
"hidden_act": "silu",
|
9 |
+
"hidden_size": 8192,
|
10 |
+
"initializer_range": 0.02,
|
11 |
+
"intermediate_size": 29568,
|
12 |
+
"max_position_embeddings": 32768,
|
13 |
+
"max_window_layers": 80,
|
14 |
+
"model_type": "qwen2",
|
15 |
+
"num_attention_heads": 64,
|
16 |
+
"num_hidden_layers": 80,
|
17 |
+
"num_key_value_heads": 8,
|
18 |
+
"rms_norm_eps": 1e-06,
|
19 |
+
"rope_scaling": null,
|
20 |
+
"rope_theta": 1000000.0,
|
21 |
+
"sliding_window": null,
|
22 |
+
"tie_word_embeddings": false,
|
23 |
+
"torch_dtype": "float32",
|
24 |
+
"transformers_version": "4.45.1",
|
25 |
+
"use_cache": false,
|
26 |
+
"use_sliding_window": false,
|
27 |
+
"vocab_size": 152064
|
28 |
+
}
|
mergekit_config.yml
ADDED
@@ -0,0 +1,8 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
models:
|
2 |
+
- model: smelborp/StellarDong-72b
|
3 |
+
- model: smelborp/StellarDong-72b
|
4 |
+
merge_method: slerp
|
5 |
+
base_model: smelborp/StellarDong-72b
|
6 |
+
dtype: float32
|
7 |
+
parameters:
|
8 |
+
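t: [0, 0.5, 1, 0.5, 0] # t goes 0 -> 1 -> 0 across layers: base_model weights at the input & output layers, the other listed model in the middle layers (both entries here are smelborp/StellarDong-72b)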
|
merges.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
model-00001-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:863f5d8e584585e59ea591228de83103a91f3c2ec4999acc18ee2b0dc538ef99
|
3 |
+
size 4982833280
|
model-00002-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a8da41188f3177ce8fd542aa6143fb6a64b168fcdb00324b32379d8c020657e2
|
3 |
+
size 4982866168
|
model-00003-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b2890748e2124b69163cbb1785320a35bf75fc3df7bfd76b6b7b698c3836c584
|
3 |
+
size 4479624672
|
model-00004-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6f97d31114ee35bf6afc72182c87ed6f3ffdc8cf21e116938c3dce2197768282
|
3 |
+
size 4479624680
|
model-00005-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cfd20bff02b8223ad47e1fa9960871414930c726087c38859730a0a7b647d7b0
|
3 |
+
size 4781684776
|
model-00006-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:58a5d1079434ab436e34b78230407aa1266ce419abb678f8b986fa50dea6baa1
|
3 |
+
size 4781651888
|
model-00007-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5bb694bbc73f6349d7f961fd773089c5cf24a02422e2aaecfe39ba5eaf37a46b
|
3 |
+
size 4479624688
|
model-00008-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7ed5a4fc146e2ccaa392465dbff099eb75d8a8cc420fbcc1541f8b5866274ed1
|
3 |
+
size 4781684776
|
model-00009-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eaeeeae7eecd647fdac496b75034697e8e061cccc054099c9b8ded325e1c4040
|
3 |
+
size 4781651888
|
model-00010-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f1294463a95cc60925809964a0e9cb913ca8a95887d97072b069acca3f79c512
|
3 |
+
size 4479624688
|
model-00011-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aa41ef18008290d10fb1b4bc564030aa1aecd49993627d88b69f0c6507f6cb59
|
3 |
+
size 4781684776
|
model-00012-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:61b3fe4608b6c599d5132187c3520b69f31539cb71a06dfb54ab24d505c78f71
|
3 |
+
size 4781651880
|
model-00013-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:97556681d703dfac4d57e1348086487f67ddec7d9925d6f9dd2b11e3910599cc
|
3 |
+
size 4479624688
|
model-00014-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3577b81b7dde0113a2b1231b15232340b7d5666e02a8477e892f701fb6732af8
|
3 |
+
size 4781684776
|
model-00015-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fb3880054c9e13f84250ad48d4258aca6c34c6b544dfa9a2583a58e21e6dd635
|
3 |
+
size 4781651888
|
model-00016-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:79d38a76003cf920e5b142a7d4692047b5d57c92ed0615969cc2f97ccf08833b
|
3 |
+
size 4479624688
|
model-00017-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4973580a5c7972f8d296784baaaf277cff57bf548c3209a815dad0955e81ac37
|
3 |
+
size 4781684776
|
model-00018-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a3e16b3ca107a5416c3181b571aed3ef89acd54e7392688b939753ed0bb06213
|
3 |
+
size 4781651888
|
model-00019-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c20853079981396bb7a623a8efd0dcb64d9d4a7189fc3f31650b606b820f7220
|
3 |
+
size 4479624688
|
model-00020-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0c8d70b67c63deeb46ee888e2526bdf9f8b29d96c9065408d602d931ce5c96a3
|
3 |
+
size 4781684768
|
model-00021-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3794abf4697c6aae312bf73b3b48005d2109051c294774ef17aca6fcfd9474bc
|
3 |
+
size 4781651888
|
model-00022-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:35b904d7f3b7f1a03b74eebcf062b83928f2c917849def2412c5acf40c27b338
|
3 |
+
size 4479624688
|
model-00023-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:115beccebdcd68f624c17ad5f8f16063f21db04fcf75ceb4951f8070208c6d19
|
3 |
+
size 4781684776
|
model-00024-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a003c0457213c9d30e0438ffea67d39f88f6ba1b82b291c72665ef5ccaa57f20
|
3 |
+
size 4781651888
|
model-00025-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7066c3d8cd74346446656a57b2d8336d915797ba50b5a28d95a0b9914a17f9f4
|
3 |
+
size 4479624688
|
model-00026-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7f23a598d8a07340b72795963b7ebd9d468e0f3750b619e87e4db096ebcd6165
|
3 |
+
size 4781684776
|
model-00027-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3950e4ef3ca56ca9dd60c110483c9623e401beca43bf07727850fa9604b57d44
|
3 |
+
size 4781651888
|
model-00028-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9f13ba465e04b0750545128f4f4c8edeed040befe5ed17c7deeee97dc083bd9e
|
3 |
+
size 4479624688
|
model-00029-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:960eaf79b15cda7f091eb2687fa953f96705794a4d3d62e5a12e28ebe3274e6f
|
3 |
+
size 4781684768
|
model-00030-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:18691353f5f720ef05990e91556b685c702dfc06f029f1baf9902e9f9b294aa6
|
3 |
+
size 4781651888
|
model-00031-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7adece308b8de81858578dbfa84147d3231a40dd35a497051e85279e04cbcd99
|
3 |
+
size 4479624688
|
model-00032-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d7d7ba62c93d9f92d0ce63aaab73785e1479e09ebfabdbd65e1fb2c56e427459
|
3 |
+
size 4781684776
|
model-00033-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:34629cf36edcd4d7551a86baff18fadfefbdd532c80e2f4db20df45afd17b17f
|
3 |
+
size 4781651888
|
model-00034-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:313a7f81bd734ec4056537fdb73cb178f6520e2e7f60109410a8f34ac6874044
|
3 |
+
size 4479624688
|
model-00035-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fc3f0a10dc525465a64c75bf46a4ffd9781b02e92192484f7e89cbf924b3b31c
|
3 |
+
size 4781684776
|
model-00036-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0c8684415e0ea3013bd7447375e08058ac86716aa2cb8f10728de0f58b81571a
|
3 |
+
size 4781651888
|
model-00037-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e0606d196a038622660f7251a676868b61cb35f2e624965a838bcf55b4ae08f3
|
3 |
+
size 4479624680
|
model-00038-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ec9f97702c1bcbe02789e7bf14e6e98a071087c358166c3f6bbdbdf405bc843e
|
3 |
+
size 4781684776
|
model-00039-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f0a341c0d3e92a3022e6192193735c77452e8cd0603541bb0ba463d7af7a63fa
|
3 |
+
size 4781651888
|
model-00040-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:23c102b72b4910cfcc7b3047621f827b6e6b43e975ba0995ed06ac1848d0ea76
|
3 |
+
size 4479624688
|
model-00041-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:10a8c74a738af46ba09313749841321445626e7e399f9b3edaff65bc3d8f8b59
|
3 |
+
size 4781684776
|
model-00042-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:44aecafd5f6ab74168d74d5ce9d1179990422d0df33be53feed9fcf95c9e8128
|
3 |
+
size 4781651888
|
model-00043-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:454e7499921ca85fae5ae2be703b0ee837fb7b805aa281b5dd4ce81e3b40e11c
|
3 |
+
size 4479624688
|
model-00044-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0960c99b2a104b74c6095e8a4d9c3e2072caa239f7930b038655cd70ce397bc9
|
3 |
+
size 4781684776
|