Text Generation
Transformers
Safetensors
English
Chinese
llama
conversational
Inference Endpoints
text-generation-inference
File size: 382 Bytes
86c6605
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
# Merge configuration: combines the two checkpoints listed under `models`
# using the `slerp` merge method.
# NOTE(review): the key names look like the mergekit config schema — confirm
# which tool consumes this file before relying on the notes below.
#
# The two checkpoints to merge. Both are absolute, machine-specific paths, so
# they need adjusting when the merge is run on a different host.
models:
  - model: /cephfs/panwenbo/work/models/Faro-9B-200K
  - model: /cephfs/panwenbo/work/models/Faro-Yi-9B-DPO
merge_method: slerp
# Same path as the first entry under `models`.
base_model: /cephfs/panwenbo/work/models/Faro-9B-200K
parameters:
  # `t` is specified per tensor-name filter, with a final unfiltered entry.
  # Presumably the interpolation factor (0 = base model, 1 = other model) and
  # the 5-element lists are spread across layer depth — TODO confirm against
  # the consuming tool's documentation.
  t:
    - filter: self_attn
      value: [0, 0.5, 0.3, 0.7, 1]
    # The mlp values are the element-wise complement (1 - x) of the
    # self_attn values above.
    - filter: mlp
      value: [1, 0.5, 0.7, 0.3, 0]
    - value: 0.5 # fallback for rest of tensors
# NOTE(review): presumably the dtype used for the merged weights — confirm.
dtype: float16