paloalma committed on
Commit
6044ecf
1 Parent(s): 81edb48

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because the commit contains too many changes. See the raw diff for the complete list.
Files changed (50) hide show
  1. README.md +17 -0
  2. config.json +30 -0
  3. mergekit_config.yml +30 -0
  4. merges.txt +0 -0
  5. model-00001-of-00082.safetensors +3 -0
  6. model-00002-of-00082.safetensors +3 -0
  7. model-00003-of-00082.safetensors +3 -0
  8. model-00004-of-00082.safetensors +3 -0
  9. model-00005-of-00082.safetensors +3 -0
  10. model-00006-of-00082.safetensors +3 -0
  11. model-00007-of-00082.safetensors +3 -0
  12. model-00008-of-00082.safetensors +3 -0
  13. model-00009-of-00082.safetensors +3 -0
  14. model-00010-of-00082.safetensors +3 -0
  15. model-00011-of-00082.safetensors +3 -0
  16. model-00012-of-00082.safetensors +3 -0
  17. model-00013-of-00082.safetensors +3 -0
  18. model-00014-of-00082.safetensors +3 -0
  19. model-00015-of-00082.safetensors +3 -0
  20. model-00016-of-00082.safetensors +3 -0
  21. model-00017-of-00082.safetensors +3 -0
  22. model-00018-of-00082.safetensors +3 -0
  23. model-00019-of-00082.safetensors +3 -0
  24. model-00020-of-00082.safetensors +3 -0
  25. model-00021-of-00082.safetensors +3 -0
  26. model-00022-of-00082.safetensors +3 -0
  27. model-00023-of-00082.safetensors +3 -0
  28. model-00024-of-00082.safetensors +3 -0
  29. model-00025-of-00082.safetensors +3 -0
  30. model-00026-of-00082.safetensors +3 -0
  31. model-00027-of-00082.safetensors +3 -0
  32. model-00028-of-00082.safetensors +3 -0
  33. model-00029-of-00082.safetensors +3 -0
  34. model-00030-of-00082.safetensors +3 -0
  35. model-00031-of-00082.safetensors +3 -0
  36. model-00032-of-00082.safetensors +3 -0
  37. model-00033-of-00082.safetensors +3 -0
  38. model-00034-of-00082.safetensors +3 -0
  39. model-00035-of-00082.safetensors +3 -0
  40. model-00036-of-00082.safetensors +3 -0
  41. model-00037-of-00082.safetensors +3 -0
  42. model-00038-of-00082.safetensors +3 -0
  43. model-00039-of-00082.safetensors +3 -0
  44. model-00040-of-00082.safetensors +3 -0
  45. model-00041-of-00082.safetensors +3 -0
  46. model-00042-of-00082.safetensors +3 -0
  47. model-00043-of-00082.safetensors +3 -0
  48. model-00044-of-00082.safetensors +3 -0
  49. model-00045-of-00082.safetensors +3 -0
  50. model-00046-of-00082.safetensors +3 -0
README.md ADDED
@@ -0,0 +1,17 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: apache-2.0
3
+ tags:
4
+ - merge
5
+ - mergekit
6
+ - lazymergekit
7
+ - abacusai/Smaug-72B-v0.1
8
+ - davidkim205/Rhea-72b-v0.5
9
+ ---
10
+
11
+ # ECE-TW3-JRGL-VHF2
12
+
13
+ ECE-TW3-JRGL-VHF2 is a merge of the following models using [mergekit](https://github.com/cg123/mergekit):
14
+ * [abacusai/Smaug-72B-v0.1](https://huggingface.co/abacusai/Smaug-72B-v0.1)
15
+ * [davidkim205/Rhea-72b-v0.5](https://huggingface.co/davidkim205/Rhea-72b-v0.5)
16
+
17
+ ## 🧩 Configuration
config.json ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "davidkim205/Rhea-72b-v0.5",
3
+ "architectures": [
4
+ "LlamaForCausalLM"
5
+ ],
6
+ "attention_bias": true,
7
+ "attention_dropout": 0.0,
8
+ "bos_token_id": 1,
9
+ "eos_token_id": 151643,
10
+ "hidden_act": "silu",
11
+ "hidden_size": 8192,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 24576,
14
+ "max_position_embeddings": 32768,
15
+ "model_type": "llama",
16
+ "num_attention_heads": 64,
17
+ "num_hidden_layers": 80,
18
+ "num_key_value_heads": 64,
19
+ "pad_token_id": 151643,
20
+ "pretraining_tp": 1,
21
+ "rms_norm_eps": 1e-06,
22
+ "rope_scaling": null,
23
+ "rope_theta": 1000000,
24
+ "seq_length": 32768,
25
+ "tie_word_embeddings": false,
26
+ "torch_dtype": "bfloat16",
27
+ "transformers_version": "4.39.3",
28
+ "use_cache": true,
29
+ "vocab_size": 152064
30
+ }
mergekit_config.yml ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ base_model: davidkim205/Rhea-72b-v0.5
2
+ dtype: bfloat16
3
+ merge_method: slerp
4
+ parameters:
5
+ t:
6
+ - filter: self_attn
7
+ value:
8
+ - 0
9
+ - 0.8
10
+ - 0.8
11
+ - 0.8
12
+ - 1
13
+ - filter: mlp
14
+ value:
15
+ - 1
16
+ - 0.2
17
+ - 0.2
18
+ - 0.2
19
+ - 0
20
+ - value: 0.2
21
+ slices:
22
+ - sources:
23
+ - layer_range:
24
+ - 0
25
+ - 80
26
+ model: abacusai/Smaug-72B-v0.1
27
+ - layer_range:
28
+ - 0
29
+ - 80
30
+ model: davidkim205/Rhea-72b-v0.5
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
model-00001-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:990db56e09d96bfd364a04073f2353756ca794632486f49d16372870774f986d
3
+ size 1879164616
model-00002-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c34db1e04e4ee00d58c91d63896a8141a1232bec0eb2f2f99ce65b855678962
3
+ size 402703024
model-00003-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9fa1a10feeab788c76005956249f06f5be60675a35069fdde009ceea4e5574ae
3
+ size 2491416720
model-00004-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fdc660c61a57f3ff06dc5263108b21219a4840d1a4f4dd603c5a252bba35d7a1
3
+ size 1879164616
model-00005-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2581ae59e907bcecf39069c818c85bd62da7085e0de700b97ee141fac87c9630
3
+ size 1879164608
model-00006-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c49256b1dc356f0985ff9e2867eeed804bdddd41759f60edffd503e6dbefa8d9
3
+ size 1610646216
model-00007-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:28e7cca0be25409e392f73e8bf7ded581200a6e19266698fa451f797773e226c
3
+ size 1744930280
model-00008-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9d1122287bbb9c345bba01b0c805f1af4d3e49783e577ddf2bd291297fb79782
3
+ size 1744930280
model-00009-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5546a8ee208f49619e691de8ada7302b64b093c99c695e1b52574e54663102d2
3
+ size 1879131376
model-00010-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a159f5f134d1fef40147fc542a5a480f58fde67387840417d7c21d4c5d15180e
3
+ size 1879148128
model-00011-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dba63600fb2d4154208f66e8a378308f0b3936b3a6f8ff077fb5c839f02acf6f
3
+ size 1879164616
model-00012-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:57f385c772a1f610c18cb9e7933f5c73bd4ca75f908b0b43a0c813434be352bf
3
+ size 1610712664
model-00013-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:83acdf29dffc1bf7729af89f0985d5e23f7448b98387051f7c21f262f114ee7f
3
+ size 1744930288
model-00014-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3eef3bb59f5e49f4edd7e66c5021e7de5455297a6aafad3e9f83ba960bbc0164
3
+ size 1879214112
model-00015-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dec9899de0847d548bba9ec697f25b3dbfb66d7a5346ef3b36f3c7d3a10a63d6
3
+ size 1879148136
model-00016-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:42d94d02eb9e436e48298b9921ccb95ad77bef8e0cf8ed9c097a4a48651392e5
3
+ size 1879164632
model-00017-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb972701c4fcaeaa496094b10218ca725314b7db9d63af8a4cd79f39187d7eea
3
+ size 1610695936
model-00018-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:390318573b31d18dadddfc4bedd4301c4653a9ac88f6c5eb33fe6afea5ef23aa
3
+ size 1744930288
model-00019-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a779e6949fdc0f47bbe5115aa6276c1488632435c1915f5ed2165ba0e2bd655
3
+ size 1744930288
model-00020-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba053453b1c3e15318fcda84392d98a054abe807103ded6dcbda265e987409de
3
+ size 1610646216
model-00021-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c02eea15c1dacb65bcd2f527e80b9c276c76f79b4a765c96faedf42f91559b08
3
+ size 1744930288
model-00022-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a5c97c8114b31dce3cdff9a9fb727c4b6d673e2af522bb9609731e3aea1c532
3
+ size 1744930288
model-00023-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:da3f9c1dac0f016ff4f5a0f4acf3e4d0c161c4f25c461b4abc528df5c02194ee
3
+ size 1879181112
model-00024-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b9425e9b30ac5de5e4f1ed8778cddcc41ada614b5260594cb947208c4fea966c
3
+ size 1879148128
model-00025-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b72ef762c70fb72d38eb9f36d8fde35a6454536cfb7ae2d4363e78953d33b093
3
+ size 1744930280
model-00026-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6260eead2095bd284e29c99879bdf4cf6f2db6b12a7feb1efe69efbca40d95a9
3
+ size 1744897296
model-00027-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9beaa999d26516848067102492e952fddc9c0fec165614991940b9cf8b9837a1
3
+ size 1744930288
model-00028-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f9be02099be2dace5d103e85735276c514a581441dd0e472173d4ce14a2ee49b
3
+ size 1879247336
model-00029-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0a35eb343929cf6c8ad8411dbd1eedbf179c194f793bb9e7943c6a1792200569
3
+ size 1744930280
model-00030-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e39e2587b62ba233531bf45b9a2ddef18dbab20c24cfbcefdd06d8ca0f47f306
3
+ size 1744930280
model-00031-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e480f6f8fd94d8ef7f77d648da2ffe2291c02e96536865e0065bae0d2e0e059
3
+ size 1879114896
model-00032-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:921b3a3a42dfdb9766d54c7b9f61e77282a9ab38c9578cfb7420f7d7f245a24f
3
+ size 1744930288
model-00033-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2bc73259e5736d020a974395f0710892dd0a4c0c59f0665b68bd0069694c678a
3
+ size 1744930288
model-00034-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6e2b094b8f127695b44dccfa7fa661ff03f2e1ec599e73fba242d8e9c33674d
3
+ size 1879147896
model-00035-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:022b3c30b9457fc6a9f45252c48b9d6406f673832f86bf7ee2c6f87611fbf3a4
3
+ size 1879164632
model-00036-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d55b8600609ae409313e2bab2083d310ce27de86dec1324a1baae51f5566c459
3
+ size 1610695944
model-00037-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b9f646129c1ec2d9de4f0cbe0ffffe90adb4ca54257459802e2fadbc8a0e10c3
3
+ size 1744897296
model-00038-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb7e86d00cefa1c4a73c2dc926ce80cd95535d5c906fa9e10aefe7226951af8e
3
+ size 1744930288
model-00039-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f5aabdc3c00ba599d5296496d8172d7ee351657f31ef7354e25d3aa3193d3568
3
+ size 1879181112
model-00040-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ebc8a8060219766fc793ca85533e0ce7ab239b27f25d103480d781a0ce5838f
3
+ size 1879148136
model-00041-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f2c1e3bae2d170d285a5e1f406c62d7cc5aae5cc8bf8000f0ca5fed523a339dd
3
+ size 1879164632
model-00042-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2437ba81b397ce4f656b50940e13f5d404816140bbf42e58a1ee1de61aeabde6
3
+ size 1879164624
model-00043-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21fb492f88262f5974cd2cb26295d217412a2bbfcbb9d0c098685f73e65fd3a5
3
+ size 1744930288
model-00044-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8eeb7990f514f9fb5d6f3ccd8fe9d292d48c6bb528316d1983ee4cee82884ad
3
+ size 1879214112
model-00045-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7ffec671128a64336aca861015c09ac8f0f633422d61d5ec415c2f5de2b0498a
3
+ size 1879148128
model-00046-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e4a358f0ef4007cd3bdeb7bbdb3bf14382abec1ec3f1a6bd180b81c7cdff9cf7
3
+ size 1744930280