# Listing metadata (not part of the config): file size 298 bytes; 49610ec (presumably a commit hash)

# Model-merge recipe: combines the three listed Qwen2.5-14B-family
# checkpoints on top of a shared base model using the `sce` merge method.

# Base checkpoint that the listed models are merged relative to.
base_model: Qwen/Qwen2.5-14B

# Merge algorithm identifier understood by the merge tool.
merge_method: sce

# Data type requested for the merge.
dtype: bfloat16

# NOTE(review): `normalize` is declared at the top level rather than under
# `parameters`; confirm the merge tool actually reads it from here for the
# `sce` method — TODO verify against the tool's config schema.
normalize: true

parameters:
  # retain top 75% high-variance parameters
  select_topk: 0.75

# Checkpoints to merge (sequence order preserved from the original recipe).
models:
  - model: Qwen/Qwen2.5-14B-Instruct-1M
  - model: deepseek-ai/DeepSeek-R1-Distill-Qwen-14B
  - model: Qwen/Qwen2.5-Coder-14B-Instruct