athirdpath's picture
Create README.md
4f56cea
|
raw
history blame
431 Bytes

# Recipe

merge_method: dare_ties

  - base_model: athirdpath/BigMistral-11b

  - model: athirdpath/DoublePivot-11b

    weight: [0.20, 0.34, 0.42, 0.53, 0.60]
    density: 0.45

  - model: athirdpath/DoubleMaid-11b

    weight: [0.65, 0.51, 0.43, 0.32, 0.25]
    density: [0.60, 0.54, 0.50, 0.48, 0.40]

  - model: athirdpath/BigMistral-11b-GLUED

    weight: 0.15
    density: 0.40

int8_mask: true

dtype: bfloat16