# Lunzima's picture
# Upload nqlsg-14b.yaml
# 9a81023 verified
---
# Stage "NQLSG-Qwen2.5-14B-Base1": combines the eleven models listed below with
# merge_method `ties`, using Chocolatine-2-14B-Instruct-v2.0.3 as base_model.
# This stage's name is listed as an input of the NQLSG-Qwen2.5-14B-MegaFusion
# document later in this file.
# NOTE(review): looks like a mergekit multi-stage config - confirm the consumer.
name: NQLSG-Qwen2.5-14B-Base1
models:
- model: sthenno/tempesthenno-nuslerp-0124
- model: sthenno/tempesthenno-ppo-ckpt40
- model: sthenno-com/miscii-14b-1225
- model: jpacifico/Chocolatine-2-14B-Instruct-v2.0b3
- model: jpacifico/Chocolatine-2-14B-Instruct-v2.0.3
- model: sometimesanotion/Lamarck-14B-v0.6
- model: sometimesanotion/Lamarck-14B-v0.7
- model: sometimesanotion/Qwen2.5-14B-Vimarckoso-v3
- model: sometimesanotion/Qwenvergence-14B-v11
- model: sometimesanotion/Qwenvergence-14B-v12-Prose-DS
- model: sometimesanotion/Qwenvergence-14B-v13-Prose-DS
# The base model also appears in the `models` list above.
base_model: jpacifico/Chocolatine-2-14B-Instruct-v2.0.3
chat_template: auto
dtype: bfloat16
merge_method: ties
# These settings must be nested under `parameters`: written at column 0,
# `parameters` parses as null and the settings become stray top-level keys.
parameters:
  weight: 1.0
  density: 1.0
  int8_mask: true
# `source` is nested under `tokenizer` for the same reason.
tokenizer:
  source: union
---
# Stage "NQLSG-Qwen2.5-14B-Base2": same model list and base_model as the
# Base1 document, but with merge_method `sce`.
# This stage's name is listed as an input of the NQLSG-Qwen2.5-14B-MegaFusion
# document later in this file.
name: NQLSG-Qwen2.5-14B-Base2
models:
- model: sthenno/tempesthenno-nuslerp-0124
- model: sthenno/tempesthenno-ppo-ckpt40
- model: sthenno-com/miscii-14b-1225
- model: jpacifico/Chocolatine-2-14B-Instruct-v2.0b3
- model: jpacifico/Chocolatine-2-14B-Instruct-v2.0.3
- model: sometimesanotion/Lamarck-14B-v0.6
- model: sometimesanotion/Lamarck-14B-v0.7
- model: sometimesanotion/Qwen2.5-14B-Vimarckoso-v3
- model: sometimesanotion/Qwenvergence-14B-v11
- model: sometimesanotion/Qwenvergence-14B-v12-Prose-DS
- model: sometimesanotion/Qwenvergence-14B-v13-Prose-DS
# The base model also appears in the `models` list above.
base_model: jpacifico/Chocolatine-2-14B-Instruct-v2.0.3
chat_template: auto
dtype: bfloat16
merge_method: sce
# `int8_mask` must be nested under `parameters`: written at column 0,
# `parameters` parses as null and the setting becomes a stray top-level key.
parameters:
  int8_mask: true
# `source` is nested under `tokenizer` for the same reason.
tokenizer:
  source: union
---
# Stage "NQLSG-Qwen2.5-14B-Base3": same model list and base_model as the
# Base1 and Base2 documents, but with merge_method `model_stock`.
# This stage's name is listed as an input of the NQLSG-Qwen2.5-14B-MegaFusion
# document later in this file.
name: NQLSG-Qwen2.5-14B-Base3
models:
- model: sthenno/tempesthenno-nuslerp-0124
- model: sthenno/tempesthenno-ppo-ckpt40
- model: sthenno-com/miscii-14b-1225
- model: jpacifico/Chocolatine-2-14B-Instruct-v2.0b3
- model: jpacifico/Chocolatine-2-14B-Instruct-v2.0.3
- model: sometimesanotion/Lamarck-14B-v0.6
- model: sometimesanotion/Lamarck-14B-v0.7
- model: sometimesanotion/Qwen2.5-14B-Vimarckoso-v3
- model: sometimesanotion/Qwenvergence-14B-v11
- model: sometimesanotion/Qwenvergence-14B-v12-Prose-DS
- model: sometimesanotion/Qwenvergence-14B-v13-Prose-DS
# The base model also appears in the `models` list above.
base_model: jpacifico/Chocolatine-2-14B-Instruct-v2.0.3
chat_template: auto
dtype: bfloat16
merge_method: model_stock
# `int8_mask` must be nested under `parameters`: written at column 0,
# `parameters` parses as null and the setting becomes a stray top-level key.
parameters:
  int8_mask: true
# `source` is nested under `tokenizer` for the same reason.
tokenizer:
  source: union
---
# Stage "NQLSG-Qwen2.5-14B-Base4": same model list as the Base1 document and
# the same merge_method (`ties`), but with Lamarck-14B-v0.6 as base_model.
# This stage's name is listed as an input of the NQLSG-Qwen2.5-14B-MegaFusion
# document later in this file.
name: NQLSG-Qwen2.5-14B-Base4
models:
- model: sthenno/tempesthenno-nuslerp-0124
- model: sthenno/tempesthenno-ppo-ckpt40
- model: sthenno-com/miscii-14b-1225
- model: jpacifico/Chocolatine-2-14B-Instruct-v2.0b3
- model: jpacifico/Chocolatine-2-14B-Instruct-v2.0.3
- model: sometimesanotion/Lamarck-14B-v0.6
- model: sometimesanotion/Lamarck-14B-v0.7
- model: sometimesanotion/Qwen2.5-14B-Vimarckoso-v3
- model: sometimesanotion/Qwenvergence-14B-v11
- model: sometimesanotion/Qwenvergence-14B-v12-Prose-DS
- model: sometimesanotion/Qwenvergence-14B-v13-Prose-DS
# The base model also appears in the `models` list above.
base_model: sometimesanotion/Lamarck-14B-v0.6
chat_template: auto
dtype: bfloat16
merge_method: ties
# These settings must be nested under `parameters`: written at column 0,
# `parameters` parses as null and the settings become stray top-level keys.
parameters:
  weight: 1.0
  density: 1.0
  int8_mask: true
# `source` is nested under `tokenizer` for the same reason.
tokenizer:
  source: union
---
# Stage "NQLSG-Qwen2.5-14B-Base5": same model list as the Base4 document and
# the same base_model (Lamarck-14B-v0.6), but with merge_method `sce`.
# This stage's name is used both as an input and as the base_model of the
# NQLSG-Qwen2.5-14B-MegaFusion document later in this file.
name: NQLSG-Qwen2.5-14B-Base5
models:
- model: sthenno/tempesthenno-nuslerp-0124
- model: sthenno/tempesthenno-ppo-ckpt40
- model: sthenno-com/miscii-14b-1225
- model: jpacifico/Chocolatine-2-14B-Instruct-v2.0b3
- model: jpacifico/Chocolatine-2-14B-Instruct-v2.0.3
- model: sometimesanotion/Lamarck-14B-v0.6
- model: sometimesanotion/Lamarck-14B-v0.7
- model: sometimesanotion/Qwen2.5-14B-Vimarckoso-v3
- model: sometimesanotion/Qwenvergence-14B-v11
- model: sometimesanotion/Qwenvergence-14B-v12-Prose-DS
- model: sometimesanotion/Qwenvergence-14B-v13-Prose-DS
# The base model also appears in the `models` list above.
base_model: sometimesanotion/Lamarck-14B-v0.6
chat_template: auto
dtype: bfloat16
merge_method: sce
# `int8_mask` must be nested under `parameters`: written at column 0,
# `parameters` parses as null and the setting becomes a stray top-level key.
parameters:
  int8_mask: true
# `source` is nested under `tokenizer` for the same reason.
tokenizer:
  source: union
---
# Stage "NQLSG-Qwen2.5-14B-Base6": same model list as the Base4 document and
# the same base_model (Lamarck-14B-v0.6), but with merge_method `model_stock`.
# This stage's name is listed as an input of the NQLSG-Qwen2.5-14B-MegaFusion
# document later in this file.
name: NQLSG-Qwen2.5-14B-Base6
models:
- model: sthenno/tempesthenno-nuslerp-0124
- model: sthenno/tempesthenno-ppo-ckpt40
- model: sthenno-com/miscii-14b-1225
- model: jpacifico/Chocolatine-2-14B-Instruct-v2.0b3
- model: jpacifico/Chocolatine-2-14B-Instruct-v2.0.3
- model: sometimesanotion/Lamarck-14B-v0.6
- model: sometimesanotion/Lamarck-14B-v0.7
- model: sometimesanotion/Qwen2.5-14B-Vimarckoso-v3
- model: sometimesanotion/Qwenvergence-14B-v11
- model: sometimesanotion/Qwenvergence-14B-v12-Prose-DS
- model: sometimesanotion/Qwenvergence-14B-v13-Prose-DS
# The base model also appears in the `models` list above.
base_model: sometimesanotion/Lamarck-14B-v0.6
chat_template: auto
dtype: bfloat16
merge_method: model_stock
# `int8_mask` must be nested under `parameters`: written at column 0,
# `parameters` parses as null and the setting becomes a stray top-level key.
parameters:
  int8_mask: true
# `source` is nested under `tokenizer` for the same reason.
tokenizer:
  source: union
---
# Stage "NQLSG-Qwen2.5-14B-MegaFusion": combines the six stages Base1..Base6
# with merge_method `sce`. Each `model` entry below matches the `name` of an
# earlier document in this file rather than a namespaced repository id.
# NOTE(review): presumably the consuming tool resolves these names to the
# outputs of the earlier stages - confirm.
name: NQLSG-Qwen2.5-14B-MegaFusion
models:
- model: NQLSG-Qwen2.5-14B-Base1
- model: NQLSG-Qwen2.5-14B-Base2
- model: NQLSG-Qwen2.5-14B-Base3
- model: NQLSG-Qwen2.5-14B-Base4
- model: NQLSG-Qwen2.5-14B-Base5
- model: NQLSG-Qwen2.5-14B-Base6
# Base5 (also listed in `models` above) serves as the base for this stage.
base_model: NQLSG-Qwen2.5-14B-Base5
chat_template: auto
dtype: bfloat16
merge_method: sce
# `int8_mask` must be nested under `parameters`: written at column 0,
# `parameters` parses as null and the setting becomes a stray top-level key.
parameters:
  int8_mask: true
# `source` is nested under `tokenizer` for the same reason.
tokenizer:
  source: union