Swallow-MoE-2x13B-v0.1 / mergekit_moe_config.yml
Aratako
model upload
b780a2a
raw
history blame contribute delete
No virus
248 Bytes
# Mixture-of-experts merge configuration: one base model plus two expert
# models, all referenced by paths relative to the working directory.

# Model named as the base of the merge; it is also listed as the first expert.
base_model: ./Superswallow-13b-v0.2

# Gate initialization mode. With `random`, the empty positive_prompts lists
# below are presumably not consulted -- TODO confirm against the mergekit docs.
gate_mode: random

# Data type requested for the merged model.
dtype: bfloat16

# Each list item is one expert: a mapping of `source_model` plus its
# `positive_prompts`. The prompts must be indented under their list item;
# at column 0 they become top-level keys and the file fails to parse.
experts:
  - source_model: ./Superswallow-13b-v0.2
    positive_prompts: []
  - source_model: ./Swallow-13b-instruct-hf
    positive_prompts: []

# NOTE(review): `tokenizer_source` is documented for regular mergekit merge
# configs; confirm that the MoE script honors it rather than ignoring it.
tokenizer_source: union