DewEfresh committed on
Commit
633ef31
1 Parent(s): 7485df8

Upload folder using huggingface_hub

Browse files
README.md ADDED
@@ -0,0 +1,158 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ base_model:
3
+ - DewEfresh/neo_7b
4
+ - DewEfresh/neo_7b
5
+ tags:
6
+ - merge
7
+ - mergekit
8
+ - lazymergekit
9
+ - DewEfresh/neo_7b
10
+ ---
11
+
12
+ # Neo_7b-merge10
13
+
14
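+ Neo_7b-merge10 is a SLERP merge, built with [LazyMergekit](https://colab.research.google.com/drive/1obulZ1ROXHjYLn6PPZJwRR6GzgQogxxb?usp=sharing), of the following models (both entries are the same checkpoint; note that every `layer_range` in the configuration below has identical start and end values, and the published `config.json` reports `num_hidden_layers: 0`):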
15
+ * [DewEfresh/neo_7b](https://huggingface.co/DewEfresh/neo_7b)
16
+ * [DewEfresh/neo_7b](https://huggingface.co/DewEfresh/neo_7b)
17
+
18
+ ## 🧩 Configuration
19
+
20
+ ```yaml
21
+ slices:
22
+ - sources:
23
+ - model: DewEfresh/neo_7b
24
+ layer_range: [0, 0]
25
+ - model: DewEfresh/neo_7b
26
+ layer_range: [3, 3]
27
+ - sources:
28
+ - model: DewEfresh/neo_7b
29
+ layer_range: [1, 1]
30
+ - model: DewEfresh/neo_7b
31
+ layer_range: [3, 3]
32
+ - sources:
33
+ - model: DewEfresh/neo_7b
34
+ layer_range: [2, 2]
35
+ - model: DewEfresh/neo_7b
36
+ layer_range: [3, 3]
37
+ - sources:
38
+ - model: DewEfresh/neo_7b
39
+ layer_range: [4, 4]
40
+ - model: DewEfresh/neo_7b
41
+ layer_range: [7, 7]
42
+ - sources:
43
+ - model: DewEfresh/neo_7b
44
+ layer_range: [5, 5]
45
+ - model: DewEfresh/neo_7b
46
+ layer_range: [7, 7]
47
+ - sources:
48
+ - model: DewEfresh/neo_7b
49
+ layer_range: [6, 6]
50
+ - model: DewEfresh/neo_7b
51
+ layer_range: [7, 7]
52
+ - sources:
53
+ - model: DewEfresh/neo_7b
54
+ layer_range: [8, 8]
55
+ - model: DewEfresh/neo_7b
56
+ layer_range: [11, 11]
57
+ - sources:
58
+ - model: DewEfresh/neo_7b
59
+ layer_range: [9, 9]
60
+ - model: DewEfresh/neo_7b
61
+ layer_range: [11, 11]
62
+ - sources:
63
+ - model: DewEfresh/neo_7b
64
+ layer_range: [10, 10]
65
+ - model: DewEfresh/neo_7b
66
+ layer_range: [11, 11]
67
+ - sources:
68
+ - model: DewEfresh/neo_7b
69
+ layer_range: [12, 12]
70
+ - model: DewEfresh/neo_7b
71
+ layer_range: [15, 15]
72
+ - sources:
73
+ - model: DewEfresh/neo_7b
74
+ layer_range: [13, 13]
75
+ - model: DewEfresh/neo_7b
76
+ layer_range: [15, 15]
77
+ - sources:
78
+ - model: DewEfresh/neo_7b
79
+ layer_range: [14, 14]
80
+ - model: DewEfresh/neo_7b
81
+ layer_range: [15, 15]
82
+ - sources:
83
+ - model: DewEfresh/neo_7b
84
+ layer_range: [16, 16]
85
+ - model: DewEfresh/neo_7b
86
+ layer_range: [19, 19]
87
+ - sources:
88
+ - model: DewEfresh/neo_7b
89
+ layer_range: [17, 17]
90
+ - model: DewEfresh/neo_7b
91
+ layer_range: [19, 19]
92
+ - sources:
93
+ - model: DewEfresh/neo_7b
94
+ layer_range: [18, 18]
95
+ - model: DewEfresh/neo_7b
96
+ layer_range: [19, 19]
97
+ - sources:
98
+ - model: DewEfresh/neo_7b
99
+ layer_range: [20, 20]
100
+ - model: DewEfresh/neo_7b
101
+ layer_range: [23, 23]
102
+ - sources:
103
+ - model: DewEfresh/neo_7b
104
+ layer_range: [21, 21]
105
+ - model: DewEfresh/neo_7b
106
+ layer_range: [23, 23]
107
+ - sources:
108
+ - model: DewEfresh/neo_7b
109
+ layer_range: [22, 22]
110
+ - model: DewEfresh/neo_7b
111
+ layer_range: [23, 23]
112
+ - sources:
113
+ - model: DewEfresh/neo_7b
114
+ layer_range: [24, 24]
115
+ - model: DewEfresh/neo_7b
116
+ layer_range: [27, 27]
117
+ - sources:
118
+ - model: DewEfresh/neo_7b
119
+ layer_range: [25, 25]
120
+ - model: DewEfresh/neo_7b
121
+ layer_range: [27, 27]
122
+ - sources:
123
+ - model: DewEfresh/neo_7b
124
+ layer_range: [26, 26]
125
+ - model: DewEfresh/neo_7b
126
+ layer_range: [27, 27]
127
+ merge_method: slerp
128
+ base_model: DewEfresh/neo_7b
129
+ parameters:
130
+ t: 0.5
131
+ dtype: bfloat16
132
+
133
+ ```
134
+
135
+ ## 💻 Usage
136
+
137
+ ```python
138
+ !pip install -qU transformers accelerate
139
+
140
+ from transformers import AutoTokenizer
141
+ import transformers
142
+ import torch
143
+
144
+ model = "DewEfresh/Neo_7b-merge10"
145
+ messages = [{"role": "user", "content": "What is a large language model?"}]
146
+
147
+ tokenizer = AutoTokenizer.from_pretrained(model)
148
+ prompt = tokenizer.apply_chat_template(messages, tokenize=False, add_generation_prompt=True)
149
+ pipeline = transformers.pipeline(
150
+ "text-generation",
151
+ model=model,
152
+ torch_dtype=torch.float16,
153
+ device_map="auto",
154
+ )
155
+
156
+ outputs = pipeline(prompt, max_new_tokens=256, do_sample=True, temperature=0.7, top_k=50, top_p=0.95)
157
+ print(outputs[0]["generated_text"])
158
+ ```
added_tokens.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "<|CLS|>": 64000,
3
+ "<|EOD|>": 64002,
4
+ "<|MASK|>": 64003,
5
+ "<|PAD|>": 64004,
6
+ "<|SEP|>": 64001
7
+ }
config.json ADDED
@@ -0,0 +1,29 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "DewEfresh/neo_7b",
3
+ "architectures": [
4
+ "LlamaForCausalLM"
5
+ ],
6
+ "attention_bias": false,
7
+ "attention_dropout": 0.0,
8
+ "bos_token_id": 1,
9
+ "eos_token_id": 2,
10
+ "hidden_act": "silu",
11
+ "hidden_size": 3072,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 24576,
14
+ "max_position_embeddings": 8192,
15
+ "mlp_bias": false,
16
+ "model_type": "llama",
17
+ "num_attention_heads": 16,
18
+ "num_hidden_layers": 0,
19
+ "num_key_value_heads": 16,
20
+ "pretraining_tp": 1,
21
+ "rms_norm_eps": 1e-05,
22
+ "rope_scaling": null,
23
+ "rope_theta": 10000.0,
24
+ "tie_word_embeddings": false,
25
+ "torch_dtype": "bfloat16",
26
+ "transformers_version": "4.42.3",
27
+ "use_cache": true,
28
+ "vocab_size": 64256
29
+ }
mergekit_config.yml ADDED
@@ -0,0 +1,113 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ slices:
3
+ - sources:
4
+ - model: DewEfresh/neo_7b
5
+ layer_range: [0, 0]
6
+ - model: DewEfresh/neo_7b
7
+ layer_range: [3, 3]
8
+ - sources:
9
+ - model: DewEfresh/neo_7b
10
+ layer_range: [1, 1]
11
+ - model: DewEfresh/neo_7b
12
+ layer_range: [3, 3]
13
+ - sources:
14
+ - model: DewEfresh/neo_7b
15
+ layer_range: [2, 2]
16
+ - model: DewEfresh/neo_7b
17
+ layer_range: [3, 3]
18
+ - sources:
19
+ - model: DewEfresh/neo_7b
20
+ layer_range: [4, 4]
21
+ - model: DewEfresh/neo_7b
22
+ layer_range: [7, 7]
23
+ - sources:
24
+ - model: DewEfresh/neo_7b
25
+ layer_range: [5, 5]
26
+ - model: DewEfresh/neo_7b
27
+ layer_range: [7, 7]
28
+ - sources:
29
+ - model: DewEfresh/neo_7b
30
+ layer_range: [6, 6]
31
+ - model: DewEfresh/neo_7b
32
+ layer_range: [7, 7]
33
+ - sources:
34
+ - model: DewEfresh/neo_7b
35
+ layer_range: [8, 8]
36
+ - model: DewEfresh/neo_7b
37
+ layer_range: [11, 11]
38
+ - sources:
39
+ - model: DewEfresh/neo_7b
40
+ layer_range: [9, 9]
41
+ - model: DewEfresh/neo_7b
42
+ layer_range: [11, 11]
43
+ - sources:
44
+ - model: DewEfresh/neo_7b
45
+ layer_range: [10, 10]
46
+ - model: DewEfresh/neo_7b
47
+ layer_range: [11, 11]
48
+ - sources:
49
+ - model: DewEfresh/neo_7b
50
+ layer_range: [12, 12]
51
+ - model: DewEfresh/neo_7b
52
+ layer_range: [15, 15]
53
+ - sources:
54
+ - model: DewEfresh/neo_7b
55
+ layer_range: [13, 13]
56
+ - model: DewEfresh/neo_7b
57
+ layer_range: [15, 15]
58
+ - sources:
59
+ - model: DewEfresh/neo_7b
60
+ layer_range: [14, 14]
61
+ - model: DewEfresh/neo_7b
62
+ layer_range: [15, 15]
63
+ - sources:
64
+ - model: DewEfresh/neo_7b
65
+ layer_range: [16, 16]
66
+ - model: DewEfresh/neo_7b
67
+ layer_range: [19, 19]
68
+ - sources:
69
+ - model: DewEfresh/neo_7b
70
+ layer_range: [17, 17]
71
+ - model: DewEfresh/neo_7b
72
+ layer_range: [19, 19]
73
+ - sources:
74
+ - model: DewEfresh/neo_7b
75
+ layer_range: [18, 18]
76
+ - model: DewEfresh/neo_7b
77
+ layer_range: [19, 19]
78
+ - sources:
79
+ - model: DewEfresh/neo_7b
80
+ layer_range: [20, 20]
81
+ - model: DewEfresh/neo_7b
82
+ layer_range: [23, 23]
83
+ - sources:
84
+ - model: DewEfresh/neo_7b
85
+ layer_range: [21, 21]
86
+ - model: DewEfresh/neo_7b
87
+ layer_range: [23, 23]
88
+ - sources:
89
+ - model: DewEfresh/neo_7b
90
+ layer_range: [22, 22]
91
+ - model: DewEfresh/neo_7b
92
+ layer_range: [23, 23]
93
+ - sources:
94
+ - model: DewEfresh/neo_7b
95
+ layer_range: [24, 24]
96
+ - model: DewEfresh/neo_7b
97
+ layer_range: [27, 27]
98
+ - sources:
99
+ - model: DewEfresh/neo_7b
100
+ layer_range: [25, 25]
101
+ - model: DewEfresh/neo_7b
102
+ layer_range: [27, 27]
103
+ - sources:
104
+ - model: DewEfresh/neo_7b
105
+ layer_range: [26, 26]
106
+ - model: DewEfresh/neo_7b
107
+ layer_range: [27, 27]
108
+ merge_method: slerp
109
+ base_model: DewEfresh/neo_7b
110
+ parameters:
111
+ t: 0.5
112
+ dtype: bfloat16
113
+
model-00001-of-00001.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:41209159383a6438fa1e73146df470aae582c40bf510ec2495a3f8780477ce87
3
+ size 789584192
model.safetensors.index.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"metadata": {"mergekit_version": "0.0.4.4", "total_size": 789583872}, "weight_map": {"lm_head.weight": "model-00001-of-00001.safetensors", "model.embed_tokens.weight": "model-00001-of-00001.safetensors", "model.norm.weight": "model-00001-of-00001.safetensors"}}
special_tokens_map.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ "<|CLS|>",
4
+ "<|SEP|>",
5
+ "<|EOD|>",
6
+ "<|MASK|>",
7
+ "<|PAD|>"
8
+ ],
9
+ "bos_token": {
10
+ "content": "<s>",
11
+ "lstrip": false,
12
+ "normalized": true,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "eos_token": {
17
+ "content": "</s>",
18
+ "lstrip": false,
19
+ "normalized": true,
20
+ "rstrip": false,
21
+ "single_word": true
22
+ },
23
+ "pad_token": {
24
+ "content": "<unk>",
25
+ "lstrip": false,
26
+ "normalized": true,
27
+ "rstrip": false,
28
+ "single_word": true
29
+ },
30
+ "unk_token": {
31
+ "content": "<unk>",
32
+ "lstrip": false,
33
+ "normalized": true,
34
+ "rstrip": false,
35
+ "single_word": true
36
+ }
37
+ }
tokenizer.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f6a2447b0e5664cabb2481587597102d82f42f0ccb7ef22e1c2d95494a8b03c5
3
+ size 1002561
tokenizer_config.json ADDED
@@ -0,0 +1,95 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_bos_token": false,
3
+ "add_eos_token": false,
4
+ "added_tokens_decoder": {
5
+ "0": {
6
+ "content": "<unk>",
7
+ "lstrip": false,
8
+ "normalized": true,
9
+ "rstrip": false,
10
+ "single_word": true,
11
+ "special": true
12
+ },
13
+ "1": {
14
+ "content": "<s>",
15
+ "lstrip": false,
16
+ "normalized": true,
17
+ "rstrip": false,
18
+ "single_word": false,
19
+ "special": true
20
+ },
21
+ "2": {
22
+ "content": "</s>",
23
+ "lstrip": false,
24
+ "normalized": true,
25
+ "rstrip": false,
26
+ "single_word": true,
27
+ "special": true
28
+ },
29
+ "64000": {
30
+ "content": "<|CLS|>",
31
+ "lstrip": false,
32
+ "normalized": false,
33
+ "rstrip": false,
34
+ "single_word": false,
35
+ "special": true
36
+ },
37
+ "64001": {
38
+ "content": "<|SEP|>",
39
+ "lstrip": false,
40
+ "normalized": false,
41
+ "rstrip": false,
42
+ "single_word": false,
43
+ "special": true
44
+ },
45
+ "64002": {
46
+ "content": "<|EOD|>",
47
+ "lstrip": false,
48
+ "normalized": false,
49
+ "rstrip": false,
50
+ "single_word": false,
51
+ "special": true
52
+ },
53
+ "64003": {
54
+ "content": "<|MASK|>",
55
+ "lstrip": false,
56
+ "normalized": false,
57
+ "rstrip": false,
58
+ "single_word": false,
59
+ "special": true
60
+ },
61
+ "64004": {
62
+ "content": "<|PAD|>",
63
+ "lstrip": false,
64
+ "normalized": false,
65
+ "rstrip": false,
66
+ "single_word": false,
67
+ "special": true
68
+ }
69
+ },
70
+ "additional_special_tokens": [
71
+ "<|CLS|>",
72
+ "<|SEP|>",
73
+ "<|EOD|>",
74
+ "<|MASK|>",
75
+ "<|PAD|>"
76
+ ],
77
+ "auto_map": {
78
+ "AutoTokenizer": [
79
+ "DewEfresh/neo_7b--tokenization_neo.NEOTokenizer",
80
+ null
81
+ ]
82
+ },
83
+ "bos_token": "<s>",
84
+ "chat_template": "{% set system_message = 'You are a helpful, respectful and honest assistant. Always answer as helpfully as possible, while being safe. Your answers should not include any harmful, unethical, racist, sexist, toxic, dangerous, or illegal content. Please ensure that your responses are socially unbiased and positive in nature.\\n\\nIf a question does not make any sense, or is not factually coherent, explain why instead of answering something not correct. If you don\\'t know the answer to a question, please don\\'t share false information.' %}{% if messages[0]['role'] == 'system' %}{% set system_message = messages[0]['content'] %}{% endif %}{% for message in messages %}{% set content = message['content'] %}{% if loop.index0 == 0 and system_message is defined %}{% set content = '<<SYS>>\\n' + system_message + '\\n<</SYS>>\\n\\n' + message['content'] %}{% endif %}{% if message['role'] == 'user' %}{{ '<s>' + '[INST] ' + content + ' [/INST]' }}{% elif message['role'] == 'assistant' %}{{ content + '</s>' }}{% endif %}{% endfor %}",
85
+ "clean_up_tokenization_spaces": false,
86
+ "eos_token": "</s>",
87
+ "model_max_length": 4096,
88
+ "pad_token": "<unk>",
89
+ "padding_side": "right",
90
+ "sp_model_kwargs": {},
91
+ "split_special_tokens": false,
92
+ "tokenizer_class": "NEOTokenizer",
93
+ "unk_token": "<unk>",
94
+ "use_fast": false
95
+ }