paloalma committed on
Commit
8c94126
1 Parent(s): 5ef8285

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
Files changed (50) hide show
  1. README.md +17 -0
  2. config.json +30 -0
  3. mergekit_config.yml +30 -0
  4. merges.txt +0 -0
  5. model-00001-of-00082.safetensors +3 -0
  6. model-00002-of-00082.safetensors +3 -0
  7. model-00003-of-00082.safetensors +3 -0
  8. model-00004-of-00082.safetensors +3 -0
  9. model-00005-of-00082.safetensors +3 -0
  10. model-00006-of-00082.safetensors +3 -0
  11. model-00007-of-00082.safetensors +3 -0
  12. model-00008-of-00082.safetensors +3 -0
  13. model-00009-of-00082.safetensors +3 -0
  14. model-00010-of-00082.safetensors +3 -0
  15. model-00011-of-00082.safetensors +3 -0
  16. model-00012-of-00082.safetensors +3 -0
  17. model-00013-of-00082.safetensors +3 -0
  18. model-00014-of-00082.safetensors +3 -0
  19. model-00015-of-00082.safetensors +3 -0
  20. model-00016-of-00082.safetensors +3 -0
  21. model-00017-of-00082.safetensors +3 -0
  22. model-00018-of-00082.safetensors +3 -0
  23. model-00019-of-00082.safetensors +3 -0
  24. model-00020-of-00082.safetensors +3 -0
  25. model-00021-of-00082.safetensors +3 -0
  26. model-00022-of-00082.safetensors +3 -0
  27. model-00023-of-00082.safetensors +3 -0
  28. model-00024-of-00082.safetensors +3 -0
  29. model-00025-of-00082.safetensors +3 -0
  30. model-00026-of-00082.safetensors +3 -0
  31. model-00027-of-00082.safetensors +3 -0
  32. model-00028-of-00082.safetensors +3 -0
  33. model-00029-of-00082.safetensors +3 -0
  34. model-00030-of-00082.safetensors +3 -0
  35. model-00031-of-00082.safetensors +3 -0
  36. model-00032-of-00082.safetensors +3 -0
  37. model-00033-of-00082.safetensors +3 -0
  38. model-00034-of-00082.safetensors +3 -0
  39. model-00035-of-00082.safetensors +3 -0
  40. model-00036-of-00082.safetensors +3 -0
  41. model-00037-of-00082.safetensors +3 -0
  42. model-00038-of-00082.safetensors +3 -0
  43. model-00039-of-00082.safetensors +3 -0
  44. model-00040-of-00082.safetensors +3 -0
  45. model-00041-of-00082.safetensors +3 -0
  46. model-00042-of-00082.safetensors +3 -0
  47. model-00043-of-00082.safetensors +3 -0
  48. model-00044-of-00082.safetensors +3 -0
  49. model-00045-of-00082.safetensors +3 -0
  50. model-00046-of-00082.safetensors +3 -0
README.md ADDED
@@ -0,0 +1,17 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: apache-2.0
3
+ tags:
4
+ - merge
5
+ - mergekit
6
+ - lazymergekit
7
+ - davidkim205/Rhea-72b-v0.5
8
+ - abacusai/Smaug-72B-v0.1
9
+ ---
10
+
11
+ # TW3-JRGL-v3
12
+
13
+ TW3-JRGL-v3 is a merge of the following models using [mergekit](https://github.com/cg123/mergekit):
14
+ * [davidkim205/Rhea-72b-v0.5](https://huggingface.co/davidkim205/Rhea-72b-v0.5)
15
+ * [abacusai/Smaug-72B-v0.1](https://huggingface.co/abacusai/Smaug-72B-v0.1)
16
+
17
+ ## 🧩 Configuration
config.json ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "davidkim205/Rhea-72b-v0.5",
3
+ "architectures": [
4
+ "LlamaForCausalLM"
5
+ ],
6
+ "attention_bias": true,
7
+ "attention_dropout": 0.0,
8
+ "bos_token_id": 1,
9
+ "eos_token_id": 151643,
10
+ "hidden_act": "silu",
11
+ "hidden_size": 8192,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 24576,
14
+ "max_position_embeddings": 32768,
15
+ "model_type": "llama",
16
+ "num_attention_heads": 64,
17
+ "num_hidden_layers": 80,
18
+ "num_key_value_heads": 64,
19
+ "pad_token_id": 151643,
20
+ "pretraining_tp": 1,
21
+ "rms_norm_eps": 1e-06,
22
+ "rope_scaling": null,
23
+ "rope_theta": 1000000,
24
+ "seq_length": 32768,
25
+ "tie_word_embeddings": false,
26
+ "torch_dtype": "bfloat16",
27
+ "transformers_version": "4.39.3",
28
+ "use_cache": true,
29
+ "vocab_size": 152064
30
+ }
mergekit_config.yml ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ base_model: davidkim205/Rhea-72b-v0.5
2
+ dtype: bfloat16
3
+ merge_method: slerp
4
+ parameters:
5
+ t:
6
+ - filter: self_attn
7
+ value:
8
+ - 0
9
+ - 0.5
10
+ - 0.3
11
+ - 0.7
12
+ - 1
13
+ - filter: mlp
14
+ value:
15
+ - 1
16
+ - 0.5
17
+ - 0.7
18
+ - 0.3
19
+ - 0
20
+ - value: 0.5
21
+ slices:
22
+ - sources:
23
+ - layer_range:
24
+ - 0
25
+ - 80
26
+ model: davidkim205/Rhea-72b-v0.5
27
+ - layer_range:
28
+ - 0
29
+ - 80
30
+ model: abacusai/Smaug-72B-v0.1
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
model-00001-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d1aa619fc57e556b10c1fcfb5c1ef908be156450c312e6bcd6de6baf66ba93aa
3
+ size 1879164616
model-00002-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c34db1e04e4ee00d58c91d63896a8141a1232bec0eb2f2f99ce65b855678962
3
+ size 402703024
model-00003-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9fa1a10feeab788c76005956249f06f5be60675a35069fdde009ceea4e5574ae
3
+ size 2491416720
model-00004-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c98d30f323e67d68b81920e502ad6a341eb72a98670cb4dd5bd1f65b07dec87b
3
+ size 1879164616
model-00005-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c4565403fda6b1c51ce0f84699e05a1494e0a45e387220471053940040577464
3
+ size 1879164608
model-00006-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c54d21b47d6108c6856a402f32b07e96cdcf39a3f6ce5e3763d545318af45c3e
3
+ size 1610646216
model-00007-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:77ae7e645d2365510c7a7463753f852b8ddf80bc2b9851fac8a5210ed432ea89
3
+ size 1744930280
model-00008-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c20636827a86ba04a498fe009b3de1c7194c300548ea46882f8c829c2834be51
3
+ size 1744930280
model-00009-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:50fe9dbd9c7a4b040dfbe222b4ae8969720fc2d0c4a3c85f4a1136227fdc0430
3
+ size 1879131376
model-00010-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a5a27df72b5d63753c039e3966b1d65fe6babe0da773909206dfc6ff25a8386c
3
+ size 1879148128
model-00011-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b479e8e92466a6b5d226fe5105436c3b43539e70f1c31cf6f44462691df6ecce
3
+ size 1879164616
model-00012-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:30ec100626c74d113e7076ae1af96869de83d5bc90147fbcc51d399381d5c790
3
+ size 1610712664
model-00013-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:da80bc929bd03725a6fc2a0252f16e52e9ad67c2489366d5bfb588347511e39c
3
+ size 1744930288
model-00014-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:430fff64ab1496ea0a379d7ba12517caa5cd95d7a2e2918a4689d1c5807b42b8
3
+ size 1879214112
model-00015-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:40fbfbc183146026b8ceaeb259718c755c55430ad768065aca4d497b89d8ab4d
3
+ size 1879148136
model-00016-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e0e6aab4f8429f361c084facea5fff49a2c66a1a66567ed881b575f721d07bf2
3
+ size 1879164632
model-00017-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1371224310cb5320c08cf34f5803717b2cb25d93acb9dbd628d230fa309d5019
3
+ size 1610695936
model-00018-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09d01140eb55ad5f2c11b00d72112003f9e96adafd7b2b4fac53a6386de52aef
3
+ size 1744930288
model-00019-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:da0df6d432d1ce6cfa62402dbf838d54cb27e4967654e1e90345c94e4a4f570e
3
+ size 1744930288
model-00020-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f772dd83cef6c1915a67133b4aae75b9bc52e093c7cded9b09a4e2f13b57f90
3
+ size 1610646216
model-00021-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:123838a9ef7ad1e952005cbd7c88c25273c17686a27d71be69341e7d4f96d393
3
+ size 1744930288
model-00022-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba9d9c312d463d47db83ff0857c00fc125599b0477bb2355ec0f248f60a66755
3
+ size 1744930288
model-00023-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eab3c0087e6316c01b57fa7e5a099c1c7624cfd442fc79daa272faa2c6039c38
3
+ size 1879181112
model-00024-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3309ec94e79dac73aaa8a70b0b381ef07ce5457763d900b9fc20623f4ff689ad
3
+ size 1879148128
model-00025-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c8e16d577c8ae740535f7c3e4c4c0487081324a244e59d594915ce216b35c71b
3
+ size 1744930280
model-00026-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d5ba1399d9553847b497b281443b2be7cd0f69b172781ec52f96edab42c4214a
3
+ size 1744897296
model-00027-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:04afa2f75a90c48e3bcc90a23e57f41ab7c2b2f077f173661faf8c7cf08b2f2d
3
+ size 1744930288
model-00028-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1889cfe68fe8c09d6a365643858f21ea8dffb834f457e1be0c33e3b85d7143fd
3
+ size 1879247336
model-00029-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:418e5878b85e1888ba43e8e09aafb2f46a74f0ef9c2658105b3f611bfe8d82fb
3
+ size 1744930280
model-00030-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:83ac7fd38cf3dd5916e63d9f918a94250889bb236657d1fcb72fd0029c48501a
3
+ size 1744930280
model-00031-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b7f06f40b47ac65566f6c7173ecc889158244c2ca6bcbdcf98a8663921dc8b25
3
+ size 1879114896
model-00032-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb822faccc3dee197f24933c5a6a2678394c5a40d0f31750025e8deb909c7d57
3
+ size 1744930288
model-00033-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f9ac94afeb2444951df56b73e84864e835b6c1a4c9aae5a527159bb0db65dd7
3
+ size 1744930288
model-00034-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ebbac9cd5111bb38fc8e455b7f7dc11e05771a123d54ed4794721c2aad40ee6
3
+ size 1879147896
model-00035-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84e0b1285910f4434c93f5a7f2959ed862dd7c1d97928c02533b3a69352c3245
3
+ size 1879164632
model-00036-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d36213a06e51901c910dd393c67e5429063436c64d3ecd7ee6a5e0c1f6509715
3
+ size 1610695944
model-00037-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e9ddfff2b53722124cb91717e23177e264b6f54f808ce2e58d8421d40be54110
3
+ size 1744897296
model-00038-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ecd8564c95e5cb681967c040aae5c86ece47a4606fdec33b1c3ad1089818fe6c
3
+ size 1744930288
model-00039-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b07325f5c85f5e3503a8163f3814a35c47090bcce883411e8196ede358696543
3
+ size 1879181112
model-00040-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e7b864b230b60d754eb354f06f86cdf8d9b0c334dafabccb4ad7e10b2782f331
3
+ size 1879148136
model-00041-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c11fcc495539e78a529a50b0f5fc9f1e76efb3627e79fe4a4da212f07871ab07
3
+ size 1879164632
model-00042-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09151e7a24ce60c458484a2c7f347ed320fc9d1978a4350ddf22dfcfd2e28960
3
+ size 1879164624
model-00043-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:52c30be8105596ba059d13a8f534be0df8e49f3e6b74e5049317c479ebcbf09a
3
+ size 1744930288
model-00044-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c97d71ddcaa9a2d15b620f3a9352f1987dbe2f4633d240a6ef96788bd1dfa16a
3
+ size 1879214112
model-00045-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e136b4de7e848f53e4eff313b28d06524ee6e5e0d5cc49af230dca2da287a10
3
+ size 1879148128
model-00046-of-00082.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9b79db05574e84a511f437a59c3ca1a30c4a98afddeb806eba0debf8199244cc
3
+ size 1744930280