Update README.md
Browse files
README.md
CHANGED
@@ -28,7 +28,7 @@ Full offload possible on 24GB VRAM with a decent context size.
|
|
28 |
- Lower quality : IQ2_XXS SOTA
|
29 |
|
30 |
Full offload possible on 16GB VRAM with a decent context size.
|
31 |
-
- IQ1_S
|
32 |
|
33 |
---
|
34 |
|
@@ -184,4 +184,39 @@ Also, for information, another requant from a Q4_K_S orphan of a 32k finetune of
|
|
184 |
- WinterGoddess-1.4x-limarpv3-70B-L2-32k-Requant-AR-b1952-iMat-c32_ch2500-Q3_K_XS.gguf,-,Winogrande,77.8216,,1267,2024-01-23 05:40:00,PEC2.5,70b,Llama_2,4096,,,GGUF,Mishima,Nexesenex,
|
185 |
- WinterGoddess-1.4x-limarpv3-70B-L2-32k-Requant-AR-b1952-iMat-c32_ch2500-Q3_K_XS.gguf,-,wikitext,4.2327,512,512,2024-01-23 01:40:00,PEC2.5,70b,Llama_2,4096,,,GGUF,Mishima,Nexesenex,
|
186 |
|
187 |
-
Draw your own conclusions as well !
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
28 |
- Lower quality : IQ2_XXS SOTA
|
29 |
|
30 |
Full offload possible on 16GB VRAM with a decent context size.
|
31 |
+
- IQ1_S (prefer v3 to v2, v2 to v1, etc)
|
32 |
|
33 |
---
|
34 |
|
|
|
184 |
- WinterGoddess-1.4x-limarpv3-70B-L2-32k-Requant-AR-b1952-iMat-c32_ch2500-Q3_K_XS.gguf,-,Winogrande,77.8216,,1267,2024-01-23 05:40:00,PEC2.5,70b,Llama_2,4096,,,GGUF,Mishima,Nexesenex,
|
185 |
- WinterGoddess-1.4x-limarpv3-70B-L2-32k-Requant-AR-b1952-iMat-c32_ch2500-Q3_K_XS.gguf,-,wikitext,4.2327,512,512,2024-01-23 01:40:00,PEC2.5,70b,Llama_2,4096,,,GGUF,Mishima,Nexesenex,
|
186 |
|
187 |
+
Draw your own conclusions as well !
|
188 |
+
|
189 |
+
----
|
190 |
+
|
191 |
+
New quants IQ1 :
|
192 |
+
|
193 |
+
- miqu-1-70b-Requant-b2116-iMat-c32_ch400-IQ1_S.gguf,-,Hellaswag,24.25,400,,2024-02-12 00:00:00,,70b,Mistral_Medium,32768,,,GGUF,Miqudev,Nexesenex,
|
194 |
+
- miqu-1-70b-Requant-b2116-iMat-c32_ch400-IQ1_S.gguf,-,Hellaswag,22.5,1000,,2024-02-12 00:00:00,,70b,Mistral_Medium,32768,,,GGUF,Miqudev,Nexesenex,
|
195 |
+
- miqu-1-70b-Requant-b2116-iMat-c32_ch400-IQ1_S.gguf,-,Arc-Challenge,25.08361204,,299,2024-02-12 00:00:00,,70b,Mistral_Medium,32768,,,GGUF,Miqudev,Nexesenex,
|
196 |
+
- miqu-1-70b-Requant-b2116-iMat-c32_ch400-IQ1_S.gguf,-,Arc-Easy,24.56140351,,570,2024-02-12 00:00:00,,70b,Mistral_Medium,32768,,,GGUF,Miqudev,Nexesenex,
|
197 |
+
- miqu-1-70b-Requant-b2116-iMat-c32_ch400-IQ1_S.gguf,-,MMLU,24.92012780,,313,2024-02-12 00:00:00,,70b,Mistral_Medium,32768,,,GGUF,Miqudev,Nexesenex,
|
198 |
+
- miqu-1-70b-Requant-b2116-iMat-c32_ch400-IQ1_S.gguf,-,Thruthful-QA,19.33904529,,817,2024-02-12 00:00:00,,70b,Mistral_Medium,32768,,,GGUF,Miqudev,Nexesenex,
|
199 |
+
- miqu-1-70b-Requant-b2116-iMat-c32_ch400-IQ1_S.gguf,-,Winogrande,50.8287,,1267,2024-02-12 00:00:00,,70b,Mistral_Medium,32768,,,GGUF,Miqudev,Nexesenex,
|
200 |
+
- miqu-1-70b-Requant-b2116-iMat-c32_ch400-IQ1_S.gguf,-,wikitext,117089.7230,512,512,2024-02-12 00:00:00,,70b,Mistral_Medium,32768,,,GGUF,Miqudev,Nexesenex,327
|
201 |
+
|
202 |
+
- miqu-1-70b-Requant-b2128-iMat-c32_ch400-IQ1_S_v2.gguf,-,Hellaswag,76,400,,2024-02-12 00:00:00,,70b,Mistral_Medium,32768,,,GGUF,Miqudev,Nexesenex,
|
203 |
+
- miqu-1-70b-Requant-b2128-iMat-c32_ch400-IQ1_S_v2.gguf,-,Hellaswag,76.3,1000,,2024-02-12 00:00:00,,70b,Mistral_Medium,32768,,,GGUF,Miqudev,Nexesenex,
|
204 |
+
- miqu-1-70b-Requant-b2128-iMat-c32_ch400-IQ1_S_v2.gguf,-,Arc-Challenge,45.15050167,,299,2024-02-12 00:00:00,,70b,Mistral_Medium,32768,,,GGUF,Miqudev,Nexesenex,
|
205 |
+
- miqu-1-70b-Requant-b2128-iMat-c32_ch400-IQ1_S_v2.gguf,-,Arc-Easy,67.54385965,,570,2024-02-12 00:00:00,,70b,Mistral_Medium,32768,,,GGUF,Miqudev,Nexesenex,
|
206 |
+
- miqu-1-70b-Requant-b2128-iMat-c32_ch400-IQ1_S_v2.gguf,-,MMLU,39.93610224,,313,2024-02-12 00:00:00,,70b,Mistral_Medium,32768,,,GGUF,Miqudev,Nexesenex,
|
207 |
+
- miqu-1-70b-Requant-b2128-iMat-c32_ch400-IQ1_S_v2.gguf,-,Thruthful-QA,29.37576499,,817,2024-02-12 00:00:00,,70b,Mistral_Medium,32768,,,GGUF,Miqudev,Nexesenex,
|
208 |
+
- miqu-1-70b-Requant-b2128-iMat-c32_ch400-IQ1_S_v2.gguf,-,Winogrande,72.6914,,1267,2024-02-12 00:00:00,,70b,Mistral_Medium,32768,,,GGUF,Miqudev,Nexesenex,
|
209 |
+
- miqu-1-70b-Requant-b2128-iMat-c32_ch400-IQ1_S_v2.gguf,-,wikitext,7.0861,512,512,2024-02-12 00:00:00,,70b,Mistral_Medium,32768,,,GGUF,Miqudev,Nexesenex,
|
210 |
+
- miqu-1-70b-Requant-b2128-iMat-c32_ch400-IQ1_S_v2.gguf,-,wikitext,5.8372,4096,4096,2024-02-12 00:00:00,,70b,Mistral_Medium,32768,,,GGUF,Miqudev,Nexesenex,
|
211 |
+
- miqu-1-70b-Requant-b2128-iMat-c32_ch400-IQ1_S_v2.gguf,-,wikitext,5.7746,4096,4096,2024-02-12 00:00:00,,70b,Mistral_Medium,32768,,,GGUF,Miqudev,Nexesenex,
|
212 |
+
|
213 |
+
- miqu-1-70b-Requant-b2131-iMat-c32_ch400-IQ1_S_v3.gguf,-,Hellaswag,78.75,,2024-02-12 00:00:00,,70b,Mistral_Medium,32768,,,GGUF,Miqudev,Nexesenex,
|
214 |
+
- miqu-1-70b-Requant-b2131-iMat-c32_ch400-IQ1_S_v3.gguf,-,Hellaswag,78.1,1000,,2024-02-12 00:00:00,,70b,Mistral_Medium,32768,,,GGUF,Miqudev,Nexesenex,
|
215 |
+
- miqu-1-70b-Requant-b2131-iMat-c32_ch400-IQ1_S_v3.gguf,-,Arc-Challenge,45.15050167,,299,2024-02-12 00:00:00,,70b,Mistral_Medium,32768,,,GGUF,Miqudev,Nexesenex,
|
216 |
+
- miqu-1-70b-Requant-b2131-iMat-c32_ch400-IQ1_S_v3.gguf,-,Arc-Easy,70.70175439,,570,2024-02-12 00:00:00,,70b,Mistral_Medium,32768,,,GGUF,Miqudev,Nexesenex,
|
217 |
+
- miqu-1-70b-Requant-b2131-iMat-c32_ch400-IQ1_S_v3.gguf,-,MMLU,38.97763578,,313,2024-02-12 00:00:00,,70b,Mistral_Medium,32768,,,GGUF,Miqudev,Nexesenex,
|
218 |
+
- miqu-1-70b-Requant-b2131-iMat-c32_ch400-IQ1_S_v3.gguf,-,Thruthful-QA,33.29253366,,817,2024-02-12 00:00:00,,70b,Mistral_Medium,32768,,,GGUF,Miqudev,Nexesenex,
|
219 |
+
- miqu-1-70b-Requant-b2131-iMat-c32_ch400-IQ1_S_v3.gguf,-,Winogrande,72.2178,,1267,2024-02-12 00:00:00,,70b,Mistral_Medium,32768,,,GGUF,Miqudev,Nexesenex,
|
220 |
+
- miqu-1-70b-Requant-b2131-iMat-c32_ch400-IQ1_S_v3.gguf,-,wikitext,6.7606,512,512,2024-02-12 00:00:00,,70b,Mistral_Medium,32768,,,GGUF,Miqudev,Nexesenex,
|
221 |
+
- miqu-1-70b-Requant-b2131-iMat-c32_ch400-IQ1_S_v3.gguf,-,wikitext,5.5886,4096,4096,2024-02-12 00:00:00,,70b,Mistral_Medium,32768,,,GGUF,Miqudev,Nexesenex,
|
222 |
+
- miqu-1-70b-Requant-b2131-iMat-c32_ch400-IQ1_S_v3.gguf,-,wikitext,5.5291,4096,4096,2024-02-12 00:00:00,,70b,Mistral_Medium,32768,,,GGUF,Miqudev,Nexesenex,
|