Upload folder using huggingface_hub

Browse files

Files changed (7)

README.md +20 -20
config.json +1 -1
mergekit_config.yml +14 -14
model-00001-of-00004.safetensors +1 -1
model-00002-of-00004.safetensors +1 -1
model-00003-of-00004.safetensors +1 -1
model-00004-of-00004.safetensors +1 -1

README.md CHANGED Viewed

@@ -1,8 +1,8 @@
 ---
 base_model:
-- MrRobotoAI/MrRoboto-ProLong-8b-v2g
-- MrRobotoAI/MrRoboto-ProLong-8b-v1n
-- MrRobotoAI/MrRoboto-ProLong-8b-v2e
 library_name: transformers
 tags:
 - mergekit
@@ -16,50 +16,50 @@ This is a merge of pre-trained language models created using [mergekit](https://
 ## Merge Details
 ### Merge Method
-This model was merged using the [TIES](https://arxiv.org/abs/2306.01708) merge method using [MrRobotoAI/MrRoboto-ProLong-8b-v1n](https://huggingface.co/MrRobotoAI/MrRoboto-ProLong-8b-v1n) as a base.
 ### Models Merged
 The following models were included in the merge:
-* [MrRobotoAI/MrRoboto-ProLong-8b-v2g](https://huggingface.co/MrRobotoAI/MrRoboto-ProLong-8b-v2g)
-* [MrRobotoAI/MrRoboto-ProLong-8b-v2e](https://huggingface.co/MrRobotoAI/MrRoboto-ProLong-8b-v2e)
 ### Configuration
 The following YAML configuration was used to produce this model:
 ```yaml
-merge_method: ties
 models:
-  - model: MrRobotoAI/MrRoboto-ProLong-8b-v2e
     parameters:
       weight:
         - filter: v_proj
-          value: [0.15, 0.15, 0.25, 0.5, 0.5, 0.5, 0.5, 0.5, 0.25, 0.15, 0.15]
         - filter: o_proj
-          value: [0.15, 0.15, 0.25, 0.5, 0.5, 0.5, 0.5, 0.5, 0.25, 0.15, 0.15]
         - filter: up_proj
-          value: [0.15, 0.15, 0.25, 0.5, 0.5, 0.5, 0.5, 0.5, 0.25, 0.15, 0.15]
         - filter: gate_proj
-          value: [0.15, 0.15, 0.25, 0.5, 0.5, 0.5, 0.5, 0.5, 0.25, 0.15, 0.15]
         - filter: down_proj
-          value: [0.15, 0.15, 0.25, 0.5, 0.5, 0.5, 0.5, 0.5, 0.25, 0.15, 0.15]
         - value: 1
-  - model: MrRobotoAI/MrRoboto-ProLong-8b-v2g
     parameters:
       weight:
         - filter: v_proj
-          value: [0.85, 0.85, 0.75, 0.5, 0.5, 0.5, 0.5, 0.5, 0.75, 0.85, 0.85]
         - filter: o_proj
-          value: [0.85, 0.85, 0.75, 0.5, 0.5, 0.5, 0.5, 0.5, 0.75, 0.85, 0.85]
         - filter: up_proj
-          value: [0.85, 0.85, 0.75, 0.5, 0.5, 0.5, 0.5, 0.5, 0.75, 0.85, 0.85]
         - filter: gate_proj
-          value: [0.85, 0.85, 0.75, 0.5, 0.5, 0.5, 0.5, 0.5, 0.75, 0.85, 0.85]
         - filter: down_proj
-          value: [0.85, 0.85, 0.75, 0.5, 0.5, 0.5, 0.5, 0.5, 0.75, 0.85, 0.85]
         - value: 0
-base_model: MrRobotoAI/MrRoboto-ProLong-8b-v1n
 tokenizer_source: base
 dtype: bfloat16
 ```

 ---
 base_model:
+- MrRobotoAI/MrRoboto-ProLong-8b-v2k
+- MrRobotoAI/Thor-v1.4-8b-DARK-FICTION
+- MrRobotoAI/MrRoboto-ProLong-8b-v2h
 library_name: transformers
 tags:
 - mergekit
 ## Merge Details
 ### Merge Method
+This model was merged using the linear [DARE](https://arxiv.org/abs/2311.03099) merge method using [MrRobotoAI/MrRoboto-ProLong-8b-v2k](https://huggingface.co/MrRobotoAI/MrRoboto-ProLong-8b-v2k) as a base.
 ### Models Merged
 The following models were included in the merge:
+* [MrRobotoAI/Thor-v1.4-8b-DARK-FICTION](https://huggingface.co/MrRobotoAI/Thor-v1.4-8b-DARK-FICTION)
+* [MrRobotoAI/MrRoboto-ProLong-8b-v2h](https://huggingface.co/MrRobotoAI/MrRoboto-ProLong-8b-v2h)
 ### Configuration
 The following YAML configuration was used to produce this model:
 ```yaml
+merge_method: dare_linear
 models:
+  - model: MrRobotoAI/Thor-v1.4-8b-DARK-FICTION
     parameters:
       weight:
         - filter: v_proj
+          value: [0.25, 0.25, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.25, 0.25]
         - filter: o_proj
+          value: [0.25, 0.25, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.25, 0.25]
         - filter: up_proj
+          value: [0.25, 0.25, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.25, 0.25]
         - filter: gate_proj
+          value: [0.25, 0.25, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.25, 0.25]
         - filter: down_proj
+          value: [0.25, 0.25, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.25, 0.25]
         - value: 1
+  - model: MrRobotoAI/MrRoboto-ProLong-8b-v2h
     parameters:
       weight:
         - filter: v_proj
+          value: [0.75, 0.75, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.75, 0.75]
         - filter: o_proj
+          value: [0.75, 0.75, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.75, 0.75]
         - filter: up_proj
+          value: [0.75, 0.75, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.75, 0.75]
         - filter: gate_proj
+          value: [0.75, 0.75, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.75, 0.75]
         - filter: down_proj
+          value: [0.75, 0.75, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.75, 0.75]
         - value: 0
+base_model: MrRobotoAI/MrRoboto-ProLong-8b-v2k
 tokenizer_source: base
 dtype: bfloat16
 ```

config.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "MrRobotoAI/MrRoboto-ProLong-8b-v1n",
   "architectures": [
     "LlamaForCausalLM"
   ],

 {
+  "_name_or_path": "MrRobotoAI/MrRoboto-ProLong-8b-v2k",
   "architectures": [
     "LlamaForCausalLM"
   ],

mergekit_config.yml CHANGED Viewed

@@ -1,33 +1,33 @@
-merge_method: ties
 models:
-  - model: MrRobotoAI/MrRoboto-ProLong-8b-v2e
     parameters:
       weight:
         - filter: v_proj
-          value: [0.15, 0.15, 0.25, 0.5, 0.5, 0.5, 0.5, 0.5, 0.25, 0.15, 0.15]
         - filter: o_proj
-          value: [0.15, 0.15, 0.25, 0.5, 0.5, 0.5, 0.5, 0.5, 0.25, 0.15, 0.15]
         - filter: up_proj
-          value: [0.15, 0.15, 0.25, 0.5, 0.5, 0.5, 0.5, 0.5, 0.25, 0.15, 0.15]
         - filter: gate_proj
-          value: [0.15, 0.15, 0.25, 0.5, 0.5, 0.5, 0.5, 0.5, 0.25, 0.15, 0.15]
         - filter: down_proj
-          value: [0.15, 0.15, 0.25, 0.5, 0.5, 0.5, 0.5, 0.5, 0.25, 0.15, 0.15]
         - value: 1
-  - model: MrRobotoAI/MrRoboto-ProLong-8b-v2g
     parameters:
       weight:
         - filter: v_proj
-          value: [0.85, 0.85, 0.75, 0.5, 0.5, 0.5, 0.5, 0.5, 0.75, 0.85, 0.85]
         - filter: o_proj
-          value: [0.85, 0.85, 0.75, 0.5, 0.5, 0.5, 0.5, 0.5, 0.75, 0.85, 0.85]
         - filter: up_proj
-          value: [0.85, 0.85, 0.75, 0.5, 0.5, 0.5, 0.5, 0.5, 0.75, 0.85, 0.85]
         - filter: gate_proj
-          value: [0.85, 0.85, 0.75, 0.5, 0.5, 0.5, 0.5, 0.5, 0.75, 0.85, 0.85]
         - filter: down_proj
-          value: [0.85, 0.85, 0.75, 0.5, 0.5, 0.5, 0.5, 0.5, 0.75, 0.85, 0.85]
         - value: 0
-base_model: MrRobotoAI/MrRoboto-ProLong-8b-v1n
 tokenizer_source: base
 dtype: bfloat16

+merge_method: dare_linear
 models:
+  - model: MrRobotoAI/Thor-v1.4-8b-DARK-FICTION
     parameters:
       weight:
         - filter: v_proj
+          value: [0.25, 0.25, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.25, 0.25]
         - filter: o_proj
+          value: [0.25, 0.25, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.25, 0.25]
         - filter: up_proj
+          value: [0.25, 0.25, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.25, 0.25]
         - filter: gate_proj
+          value: [0.25, 0.25, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.25, 0.25]
         - filter: down_proj
+          value: [0.25, 0.25, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.25, 0.25]
         - value: 1
+  - model: MrRobotoAI/MrRoboto-ProLong-8b-v2h
     parameters:
       weight:
         - filter: v_proj
+          value: [0.75, 0.75, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.75, 0.75]
         - filter: o_proj
+          value: [0.75, 0.75, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.75, 0.75]
         - filter: up_proj
+          value: [0.75, 0.75, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.75, 0.75]
         - filter: gate_proj
+          value: [0.75, 0.75, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.75, 0.75]
         - filter: down_proj
+          value: [0.75, 0.75, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.5, 0.75, 0.75]
         - value: 0
+base_model: MrRobotoAI/MrRoboto-ProLong-8b-v2k
 tokenizer_source: base
 dtype: bfloat16

model-00001-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:809be62669fd137bee689f27d4bd76263c6b9b108071b049dd91f19adcd9573d
 size 4953586384

 version https://git-lfs.github.com/spec/v1
+oid sha256:01369721bb73c919970a271c9b300f6a9dc80151a79d357bb809170234e769c5
 size 4953586384

model-00002-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:68fbd16248bb797b6116978c6c1932d3ca70fd970d0553060961f4924e5ee7a8
 size 4999819336

 version https://git-lfs.github.com/spec/v1
+oid sha256:ee61ec15b9cc941be0896e4c392f98186da9d4e124af310f9fd97678e027c55c
 size 4999819336

model-00003-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:cea27cdf0b846a1e00e0ce476b43aab211d216232d949251b9f905f4d1fa352a
 size 4915916144

 version https://git-lfs.github.com/spec/v1
+oid sha256:0f2a5192d07a8be66835093a322f66d04fc9a6a0288acfc98cc77de880c35888
 size 4915916144

model-00004-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:64b2772fd10f7173971faf5a5450d57fb6970b75d4b66ca187d67cd691888087
 size 1191234472

 version https://git-lfs.github.com/spec/v1
+oid sha256:1a8ff4c645398e0f65ede3055ad7e0c5263eed63bf5b416fac7095a8e56fddc8
 size 1191234472