Update preset.json
Browse files- preset.json +25 -22
preset.json
CHANGED
@@ -1,35 +1,38 @@
|
|
1 |
{
|
2 |
-
"name": "Biggie SmoLlm
|
|
|
3 |
"load_params": {
|
4 |
-
"n_ctx":
|
5 |
"n_batch": 512,
|
6 |
"n_gpu_layers": 0,
|
7 |
-
"use_mlock":
|
8 |
-
"
|
9 |
-
"
|
10 |
-
"seed": -1,
|
11 |
"f16_kv": false,
|
12 |
-
"
|
13 |
-
"
|
14 |
-
"key_type": "q8_0",
|
15 |
-
"value_type": "q8_0"
|
16 |
-
}
|
17 |
},
|
18 |
"inference_params": {
|
19 |
"n_threads": 1,
|
20 |
"n_predict": 1024,
|
21 |
-
"top_k":
|
22 |
"top_p": 0.85,
|
23 |
"temperature": 1.5,
|
24 |
-
"repeat_penalty": 1.
|
25 |
"min_p": 0.3,
|
26 |
-
"
|
27 |
-
"
|
28 |
-
"
|
29 |
-
|
30 |
-
|
31 |
-
"
|
32 |
-
"
|
33 |
-
"
|
|
|
|
|
|
|
|
|
|
|
|
|
34 |
}
|
35 |
-
}
|
|
|
1 |
{
|
2 |
+
"name": "Biggie SmoLlm Q8_0",
|
3 |
+
"model_path": "biggie_groked_int8_q8_0.gguf",
|
4 |
"load_params": {
|
5 |
+
"n_ctx": 2048,
|
6 |
"n_batch": 512,
|
7 |
"n_gpu_layers": 0,
|
8 |
+
"use_mlock": true,
|
9 |
+
"rope_freq_base": 10000,
|
10 |
+
"rope_freq_scale": 1.0,
|
|
|
11 |
"f16_kv": false,
|
12 |
+
"cache_type_k": "q8_0", // 🔑 Equivalent to -ctk q8_0
|
13 |
+
"cache_type_v": "q8_0"
|
|
|
|
|
|
|
14 |
},
|
15 |
"inference_params": {
|
16 |
"n_threads": 1,
|
17 |
"n_predict": 1024,
|
18 |
+
"top_k": 40,
|
19 |
"top_p": 0.85,
|
20 |
"temperature": 1.5,
|
21 |
+
"repeat_penalty": 1.1,
|
22 |
"min_p": 0.3,
|
23 |
+
"mirostat": 0,
|
24 |
+
"mirostat_tau": 5,
|
25 |
+
"mirostat_eta": 0.1,
|
26 |
+
"tfs_z": 1,
|
27 |
+
"typical_p": 1,
|
28 |
+
"presence_penalty": 0,
|
29 |
+
"frequency_penalty": 0,
|
30 |
+
"pre_prompt": "You are a NASA JPL Scientist.",
|
31 |
+
"pre_prompt_suffix": "\n",
|
32 |
+
"pre_prompt_prefix": "",
|
33 |
+
"input_prefix": "<|im_start|>Human: ",
|
34 |
+
"input_suffix": "\n",
|
35 |
+
"antiprompt": ["Human:"],
|
36 |
+
"stop_sequences": []
|
37 |
}
|
38 |
+
}
|