morriszms committed on
Commit
ac5ea0d
1 Parent(s): e50acec

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -33,3 +33,15 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ notus-7b-v1-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text
37
+ notus-7b-v1-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text
38
+ notus-7b-v1-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text
39
+ notus-7b-v1-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text
40
+ notus-7b-v1-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text
41
+ notus-7b-v1-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text
42
+ notus-7b-v1-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text
43
+ notus-7b-v1-Q5_0.gguf filter=lfs diff=lfs merge=lfs -text
44
+ notus-7b-v1-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text
45
+ notus-7b-v1-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text
46
+ notus-7b-v1-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text
47
+ notus-7b-v1-Q8_0.gguf filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,211 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ datasets:
3
+ - argilla/ultrafeedback-binarized-preferences
4
+ language:
5
+ - en
6
+ base_model: argilla/notus-7b-v1
7
+ library_name: transformers
8
+ pipeline_tag: text-generation
9
+ tags:
10
+ - dpo
11
+ - rlaif
12
+ - preference
13
+ - ultrafeedback
14
+ - TensorBlock
15
+ - GGUF
16
+ license: mit
17
+ model-index:
18
+ - name: notus-7b-v1
19
+ results:
20
+ - task:
21
+ type: text-generation
22
+ name: Text Generation
23
+ dataset:
24
+ name: AI2 Reasoning Challenge (25-Shot)
25
+ type: ai2_arc
26
+ config: ARC-Challenge
27
+ split: test
28
+ args:
29
+ num_few_shot: 25
30
+ metrics:
31
+ - type: acc_norm
32
+ value: 0.6459044368600683
33
+ name: normalized accuracy
34
+ source:
35
+ url: https://huggingface.co/datasets/open-llm-leaderboard/results/blob/main/argilla/notus-7b-v1/results_2023-11-29T22-16-51.521321.json
36
+ name: Open LLM Leaderboard Results
37
+ - task:
38
+ type: text-generation
39
+ name: Text Generation
40
+ dataset:
41
+ name: HellaSwag (10-Shot)
42
+ type: hellaswag
43
+ split: validation
44
+ args:
45
+ num_few_shot: 10
46
+ metrics:
47
+ - type: acc_norm
48
+ value: 0.8478390758812986
49
+ name: normalized accuracy
50
+ source:
51
+ url: https://huggingface.co/datasets/open-llm-leaderboard/results/blob/main/argilla/notus-7b-v1/results_2023-11-29T22-16-51.521321.json
52
+ name: Open LLM Leaderboard Results
53
+ - task:
54
+ type: text-generation
55
+ name: Text Generation
56
+ dataset:
57
+ name: TruthfulQA (0-shot)
58
+ type: truthful_qa
59
+ config: multiple_choice
60
+ split: validation
61
+ args:
62
+ num_few_shot: 0
63
+ metrics:
64
+ - type: mc2
65
+ value: 0.5436768358952805
66
+ source:
67
+ url: https://huggingface.co/datasets/open-llm-leaderboard/results/blob/main/argilla/notus-7b-v1/results_2023-11-29T22-16-51.521321.json
68
+ name: Open LLM Leaderboard Results
69
+ - task:
70
+ type: text-generation
71
+ name: Text Generation
72
+ dataset:
73
+ name: MMLU (5-Shot)
74
+ type: cais/mmlu
75
+ config: all
76
+ split: test
77
+ args:
78
+ num_few_shot: 5
79
+ metrics:
80
+ - type: acc
81
+ value: 0.6303308230938872
82
+ name: accuracy
83
+ source:
84
+ url: https://huggingface.co/datasets/open-llm-leaderboard/results/blob/main/argilla/notus-7b-v1/results_2023-11-29T22-16-51.521321.json
85
+ name: Open LLM Leaderboard Results
86
+ - task:
87
+ type: text-generation
88
+ name: Text Generation
89
+ dataset:
90
+ name: GSM8k (5-shot)
91
+ type: gsm8k
92
+ config: main
93
+ split: test
94
+ args:
95
+ num_few_shot: 5
96
+ metrics:
97
+ - type: acc
98
+ value: 0.1516300227445034
99
+ name: accuracy
100
+ source:
101
+ url: https://huggingface.co/datasets/open-llm-leaderboard/results/blob/main/argilla/notus-7b-v1/results_2023-11-29T22-16-51.521321.json
102
+ name: Open LLM Leaderboard Results
103
+ - task:
104
+ type: text-generation
105
+ name: Text Generation
106
+ dataset:
107
+ name: Winogrande (5-shot)
108
+ type: winogrande
109
+ config: winogrande_xl
110
+ split: validation
111
+ args:
112
+ num_few_shot: 5
113
+ metrics:
114
+ - type: acc
115
+ value: 0.7940015785319653
116
+ name: accuracy
117
+ source:
118
+ url: https://huggingface.co/datasets/open-llm-leaderboard/results/blob/main/argilla/notus-7b-v1/results_2023-11-29T22-16-51.521321.json
119
+ name: Open LLM Leaderboard Results
120
+ - task:
121
+ type: text-generation
122
+ name: Text Generation
123
+ dataset:
124
+ name: AlpacaEval
125
+ type: tatsu-lab/alpaca_eval
126
+ metrics:
127
+ - type: tatsu-lab/alpaca_eval
128
+ value: 0.9142
129
+ name: win rate
130
+ source:
131
+ url: https://tatsu-lab.github.io/alpaca_eval/
132
+ - task:
133
+ type: text-generation
134
+ name: Text Generation
135
+ dataset:
136
+ name: MT-Bench
137
+ type: unknown
138
+ metrics:
139
+ - type: unknown
140
+ value: 7.3
141
+ name: score
142
+ source:
143
+ url: https://huggingface.co/spaces/lmsys/mt-bench
144
+ ---
145
+
146
+ <div style="width: auto; margin-left: auto; margin-right: auto">
147
+ <img src="https://i.imgur.com/jC7kdl8.jpeg" alt="TensorBlock" style="width: 100%; min-width: 400px; display: block; margin: auto;">
148
+ </div>
149
+ <div style="display: flex; justify-content: space-between; width: 100%;">
150
+ <div style="display: flex; flex-direction: column; align-items: flex-start;">
151
+ <p style="margin-top: 0.5em; margin-bottom: 0em;">
152
+ Feedback and support: TensorBlock's <a href="https://x.com/tensorblock_aoi">Twitter/X</a>, <a href="https://t.me/TensorBlock">Telegram Group</a> and <a href="https://x.com/tensorblock_aoi">Discord server</a>
153
+ </p>
154
+ </div>
155
+ </div>
156
+
157
+ ## argilla/notus-7b-v1 - GGUF
158
+
159
+ This repo contains GGUF format model files for [argilla/notus-7b-v1](https://huggingface.co/argilla/notus-7b-v1).
160
+
161
+ The files were quantized using machines provided by [TensorBlock](https://tensorblock.co/), and they are compatible with llama.cpp as of [commit b4011](https://github.com/ggerganov/llama.cpp/commit/a6744e43e80f4be6398fc7733a01642c846dce1d).
162
+
163
+ ## Prompt template
164
+
165
+ ```
166
+ <|system|>
167
+ {system_prompt}</s>
168
+ <|user|>
169
+ {prompt}</s>
170
+ <|assistant|>
171
+ ```
172
+
173
+ ## Model file specification
174
+
175
+ | Filename | Quant type | File Size | Description |
176
+ | -------- | ---------- | --------- | ----------- |
177
+ | [notus-7b-v1-Q2_K.gguf](https://huggingface.co/tensorblock/notus-7b-v1-GGUF/tree/main/notus-7b-v1-Q2_K.gguf) | Q2_K | 2.532 GB | smallest, significant quality loss - not recommended for most purposes |
178
+ | [notus-7b-v1-Q3_K_S.gguf](https://huggingface.co/tensorblock/notus-7b-v1-GGUF/tree/main/notus-7b-v1-Q3_K_S.gguf) | Q3_K_S | 2.947 GB | very small, high quality loss |
179
+ | [notus-7b-v1-Q3_K_M.gguf](https://huggingface.co/tensorblock/notus-7b-v1-GGUF/tree/main/notus-7b-v1-Q3_K_M.gguf) | Q3_K_M | 3.277 GB | very small, high quality loss |
180
+ | [notus-7b-v1-Q3_K_L.gguf](https://huggingface.co/tensorblock/notus-7b-v1-GGUF/tree/main/notus-7b-v1-Q3_K_L.gguf) | Q3_K_L | 3.560 GB | small, substantial quality loss |
181
+ | [notus-7b-v1-Q4_0.gguf](https://huggingface.co/tensorblock/notus-7b-v1-GGUF/tree/main/notus-7b-v1-Q4_0.gguf) | Q4_0 | 3.827 GB | legacy; small, very high quality loss - prefer using Q3_K_M |
182
+ | [notus-7b-v1-Q4_K_S.gguf](https://huggingface.co/tensorblock/notus-7b-v1-GGUF/tree/main/notus-7b-v1-Q4_K_S.gguf) | Q4_K_S | 3.856 GB | small, greater quality loss |
183
+ | [notus-7b-v1-Q4_K_M.gguf](https://huggingface.co/tensorblock/notus-7b-v1-GGUF/tree/main/notus-7b-v1-Q4_K_M.gguf) | Q4_K_M | 4.068 GB | medium, balanced quality - recommended |
184
+ | [notus-7b-v1-Q5_0.gguf](https://huggingface.co/tensorblock/notus-7b-v1-GGUF/tree/main/notus-7b-v1-Q5_0.gguf) | Q5_0 | 4.654 GB | legacy; medium, balanced quality - prefer using Q4_K_M |
185
+ | [notus-7b-v1-Q5_K_S.gguf](https://huggingface.co/tensorblock/notus-7b-v1-GGUF/tree/main/notus-7b-v1-Q5_K_S.gguf) | Q5_K_S | 4.654 GB | large, low quality loss - recommended |
186
+ | [notus-7b-v1-Q5_K_M.gguf](https://huggingface.co/tensorblock/notus-7b-v1-GGUF/tree/main/notus-7b-v1-Q5_K_M.gguf) | Q5_K_M | 4.779 GB | large, very low quality loss - recommended |
187
+ | [notus-7b-v1-Q6_K.gguf](https://huggingface.co/tensorblock/notus-7b-v1-GGUF/tree/main/notus-7b-v1-Q6_K.gguf) | Q6_K | 5.534 GB | very large, extremely low quality loss |
188
+ | [notus-7b-v1-Q8_0.gguf](https://huggingface.co/tensorblock/notus-7b-v1-GGUF/tree/main/notus-7b-v1-Q8_0.gguf) | Q8_0 | 7.167 GB | very large, extremely low quality loss - not recommended |
189
+
190
+
191
+ ## Download instructions
192
+
193
+ ### Command line
194
+
195
+ First, install the Hugging Face Hub command-line client:
196
+
197
+ ```shell
198
+ pip install -U "huggingface_hub[cli]"
199
+ ```
200
+
201
+ Then, download an individual model file to a local directory:
202
+
203
+ ```shell
204
+ huggingface-cli download tensorblock/notus-7b-v1-GGUF --include "notus-7b-v1-Q2_K.gguf" --local-dir MY_LOCAL_DIR
205
+ ```
206
+
207
+ If you want to download multiple model files matching a pattern (e.g., `*Q4_K*gguf`), you can run:
208
+
209
+ ```shell
210
+ huggingface-cli download tensorblock/notus-7b-v1-GGUF --local-dir MY_LOCAL_DIR --local-dir-use-symlinks False --include='*Q4_K*gguf'
211
+ ```
notus-7b-v1-Q2_K.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:971f0c38df64f6193310bbf13e448589b99d01d9bfa742179fbf7784743f7fdc
3
+ size 2719243264
notus-7b-v1-Q3_K_L.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:73e8aacf15a54399dc4f03d190d90362a0e717f24cdb3d590b3095a45052a7c8
3
+ size 3822025728
notus-7b-v1-Q3_K_M.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c38f322a65ab3b6116044b109d72c89e6fcdead6535aae13e988bba2638c6494
3
+ size 3518987264
notus-7b-v1-Q3_K_S.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7193f17618c7b52e605024627ac3ab1a3615c0fcce6d996f67d687f1079c4eff
3
+ size 3164568576
notus-7b-v1-Q4_0.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c66b1b77af8d0acdba7c8011866b7dc280ce37f06fbd0768db2678071b38e712
3
+ size 4108917760
notus-7b-v1-Q4_K_M.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:311a1033332c34b7dbfc99a29206f04adac224b3fa359d04dce51ad07e69df31
3
+ size 4368440320
notus-7b-v1-Q4_K_S.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:adf230ebbe490597f31779ad95b576abb8f5f3fe7d6b3055e22c6fe689d38530
3
+ size 4140375040
notus-7b-v1-Q5_0.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8ba75a39dc01b52bff8f978141cb1e9621eb8f41fa6fabb8c95d5c2b7f26653b
3
+ size 4997716992
notus-7b-v1-Q5_K_M.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:46adc186681997e45c627b74cb2406eb99c36cadffb7ac5f4b9ebcc108e91aa3
3
+ size 5131410432
notus-7b-v1-Q5_K_S.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:50607a90d7de55d076acbb7918e2979180b622580be3a39cc2900593f94d2d21
3
+ size 4997716992
notus-7b-v1-Q6_K.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bc3296f6acda4cd4f0ff83ea2b0e30afc34c9ae97be366b760d5521699635c97
3
+ size 5942066176
notus-7b-v1-Q8_0.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:951ef5c8343052015a964c008d5f07da3dd2344a02a947f69e488a980ba320b4
3
+ size 7695858688