Text Generation
Transformers
Safetensors
mixtral
Mixture of Experts
sharegpt
axolotl
conversational
text-generation-inference

Upload folder using huggingface_hub

#3
This view is limited to 50 files because it contains too many changes.  See the raw diff here.
Files changed (50) hide show
  1. added_tokens.json +4 -0
  2. config.json +31 -0
  3. generation_config.json +7 -0
  4. model-00001-of-00117.safetensors +3 -0
  5. model-00002-of-00117.safetensors +3 -0
  6. model-00003-of-00117.safetensors +3 -0
  7. model-00004-of-00117.safetensors +3 -0
  8. model-00005-of-00117.safetensors +3 -0
  9. model-00006-of-00117.safetensors +3 -0
  10. model-00007-of-00117.safetensors +3 -0
  11. model-00008-of-00117.safetensors +3 -0
  12. model-00009-of-00117.safetensors +3 -0
  13. model-00010-of-00117.safetensors +3 -0
  14. model-00011-of-00117.safetensors +3 -0
  15. model-00012-of-00117.safetensors +3 -0
  16. model-00013-of-00117.safetensors +3 -0
  17. model-00014-of-00117.safetensors +3 -0
  18. model-00015-of-00117.safetensors +3 -0
  19. model-00016-of-00117.safetensors +3 -0
  20. model-00017-of-00117.safetensors +3 -0
  21. model-00018-of-00117.safetensors +3 -0
  22. model-00019-of-00117.safetensors +3 -0
  23. model-00020-of-00117.safetensors +3 -0
  24. model-00021-of-00117.safetensors +3 -0
  25. model-00022-of-00117.safetensors +3 -0
  26. model-00023-of-00117.safetensors +3 -0
  27. model-00024-of-00117.safetensors +3 -0
  28. model-00025-of-00117.safetensors +3 -0
  29. model-00026-of-00117.safetensors +3 -0
  30. model-00027-of-00117.safetensors +3 -0
  31. model-00028-of-00117.safetensors +3 -0
  32. model-00029-of-00117.safetensors +3 -0
  33. model-00030-of-00117.safetensors +3 -0
  34. model-00031-of-00117.safetensors +3 -0
  35. model-00032-of-00117.safetensors +3 -0
  36. model-00033-of-00117.safetensors +3 -0
  37. model-00034-of-00117.safetensors +3 -0
  38. model-00035-of-00117.safetensors +3 -0
  39. model-00036-of-00117.safetensors +3 -0
  40. model-00037-of-00117.safetensors +3 -0
  41. model-00038-of-00117.safetensors +3 -0
  42. model-00039-of-00117.safetensors +3 -0
  43. model-00040-of-00117.safetensors +3 -0
  44. model-00041-of-00117.safetensors +3 -0
  45. model-00042-of-00117.safetensors +3 -0
  46. model-00043-of-00117.safetensors +3 -0
  47. model-00044-of-00117.safetensors +3 -0
  48. model-00045-of-00117.safetensors +3 -0
  49. model-00046-of-00117.safetensors +3 -0
  50. model-00047-of-00117.safetensors +3 -0
added_tokens.json ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ {
2
+ "<|im_end|>": 32000,
3
+ "<|im_start|>": 32001
4
+ }
config.json ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "v2ray/Mixtral-8x22B-v0.1",
3
+ "architectures": [
4
+ "MixtralForCausalLM"
5
+ ],
6
+ "attention_dropout": 0.0,
7
+ "bos_token_id": 1,
8
+ "eos_token_id": 32000,
9
+ "hidden_act": "silu",
10
+ "hidden_size": 6144,
11
+ "initializer_range": 0.02,
12
+ "intermediate_size": 16384,
13
+ "max_position_embeddings": 65536,
14
+ "model_type": "mixtral",
15
+ "num_attention_heads": 48,
16
+ "num_experts_per_tok": 2,
17
+ "num_hidden_layers": 56,
18
+ "num_key_value_heads": 8,
19
+ "num_local_experts": 8,
20
+ "output_router_logits": false,
21
+ "rms_norm_eps": 1e-05,
22
+ "rope_theta": 1000000,
23
+ "router_aux_loss_coef": 0.001,
24
+ "router_jitter_noise": 0.0,
25
+ "sliding_window": null,
26
+ "tie_word_embeddings": false,
27
+ "torch_dtype": "float32",
28
+ "transformers_version": "4.40.0.dev0",
29
+ "use_cache": false,
30
+ "vocab_size": 32002
31
+ }
generation_config.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 1,
4
+ "do_sample": true,
5
+ "eos_token_id": 2,
6
+ "transformers_version": "4.40.0.dev0"
7
+ }
model-00001-of-00117.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dcc5002691f06c27ac489e643fd3b9fc284146dece90ab388081b72c0a063f25
3
+ size 4762879840
model-00002-of-00117.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f1b5c31dea55980a9b646ce2494097e35e691e4295f21ff4ffeccd66b59ed7d1
3
+ size 4831839800
model-00003-of-00117.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:07ddbfaf55fb5e2415cab20829d5de5229556de6626b32f4d3d96bbc460be783
3
+ size 4781754592
model-00004-of-00117.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4f14147450632a545cb09c344640e6838ea893bb63484500c0827c36e58ed58d
3
+ size 4831839800
model-00005-of-00117.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7ded3ad7edcbe6edda24506d4d388bf081603e7bd8a12841a0959b1112eb26af
3
+ size 4781754592
model-00006-of-00117.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b17c4d67b9454b7a10efb53d0163ee761408ff334f58af68aaa9db84972c949e
3
+ size 4831839800
model-00007-of-00117.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2c7753c82d8db058eed516df7ff10e511f0ae1a222a4882b9d15c209f9ecc73c
3
+ size 4781754592
model-00008-of-00117.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8b453fe7ec3831d08208c1bf8047665dad82cea0f14ae28fe5ce006f5ddec60b
3
+ size 4831839800
model-00009-of-00117.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:95207c5c18d23dddcc16d2399fd42f0cb4b4046b9abed4e6212eadace55ff1b7
3
+ size 4781754592
model-00010-of-00117.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e7438ce11ba78f8aa53522b69df108c46756f606710549db1800e01f2557e99
3
+ size 4831839800
model-00011-of-00117.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:36d3bc159acdf00f775ba1caa94ff6a6011b4176de0321377474c2c7ab57531f
3
+ size 4781754592
model-00012-of-00117.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:007fa45d011278e4f4ec26afcd2be2832dbdc4f5eeb9de4a951db8f2d8857cb3
3
+ size 4831839800
model-00013-of-00117.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e1958ca6d10b3c677786c9c9bd19e2ea417be9b102ed85d45c04ca55c0646b53
3
+ size 4781754592
model-00014-of-00117.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc1064d5796463c81675cc1eacd2ea24425c0291e2610b074ccad46ac0edabe5
3
+ size 4831839800
model-00015-of-00117.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:38cf3fb19d18aa781b4779226c7a9e5026a09b001a04667ceb8f51c70903abd8
3
+ size 4781754592
model-00016-of-00117.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7df301d9acde7f8f821e5992181a56ab2fe6283c42e0ded5d9b8c7a33289a245
3
+ size 4831839800
model-00017-of-00117.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2918efe7c741c9f3081e6d74ed0bf9a01c0cceee8e7275a32e18ea1a76f4e507
3
+ size 4781754592
model-00018-of-00117.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a71f6ed97aa70216934380dda6f5146880ed2aaef3caa0fd901ae07090ee2232
3
+ size 4831839800
model-00019-of-00117.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:23d513bdefe37af4b6fda7a57c85e19456a6401ab50126d53337842ab79c7931
3
+ size 4781754592
model-00020-of-00117.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f519c89e124efe8b2dffffddf6df07ea3031e7df20410f58507d37a14211ddb
3
+ size 4831839800
model-00021-of-00117.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a3ae2674cce96785abe0c3f9b94a772d2aff88aa80eb103f0da30359aa12d7c1
3
+ size 4982884240
model-00022-of-00117.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6731e496eb59b312aa94d70eff938ac8e3a6a9fcbe0fd47fb90280f1e837345f
3
+ size 4630710168
model-00023-of-00117.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aad451806e84e57a11437ab1cb62a3946ff82df6e24392a78ae12ee1b99da90f
3
+ size 4831839808
model-00024-of-00117.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8c919f3dfe5375cf24d277bb1162c1e307fe67872dfff8e35829b8c5f8a898b
3
+ size 4781754608
model-00025-of-00117.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5726ff602cffd3c27bb930a5eaf1b2a7d33d382c6265ee532e9dc5ac21f7d77d
3
+ size 4831839808
model-00026-of-00117.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a512f7d05c5433d3f2f194f0467a142c93fad0b9647ceda79d43b349835729a
3
+ size 4781754608
model-00027-of-00117.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7ebb1a3f8e8ee13b5c726865e8deec1c0251b4ef31fc4dd94bd564b836ce5d8d
3
+ size 4831839808
model-00028-of-00117.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca2942fb7ca1738c4bc87e8074064db4ba897d08ae5b4f0fab3d9651773474d7
3
+ size 4781754608
model-00029-of-00117.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:660bdb970d14f121685ec8ffc4470d2f40435f73f9cbc2f2dfe73abe5cecd84f
3
+ size 4831839808
model-00030-of-00117.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f6aadff68ad38925d9c5d2406aef4a212cc809864dbeb18569efc24347c34878
3
+ size 4781754608
model-00031-of-00117.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef00d619f88d0a58c4a41cf18cc502eaf92c93fb869d07cebb060c042bc10490
3
+ size 4831839808
model-00032-of-00117.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:090ab543c34b05951c3c224c01b84847dc9d962d2f038917ae8ee0c87f6a699a
3
+ size 4781754608
model-00033-of-00117.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:85a67db67088d7c47539b1de9d840a483e75e9da57c3ee83fba31be32c4a8cb9
3
+ size 4831839808
model-00034-of-00117.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:12416253fbb2f2f04c73f06778d10358c64309ae4ca71f58f2c99d07af3be8c2
3
+ size 4781754608
model-00035-of-00117.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3ef54fdc7dfb252ed1c96fef3b5cd11bff6b0346c628a9a7f2f34f30ef2d3397
3
+ size 4831839808
model-00036-of-00117.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf215bac1467d9faf3bdc6ef5e121a265f22385dfb855067a73b218df957005f
3
+ size 4781754608
model-00037-of-00117.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:64b3d8dd4fad431d1a3bd56aed46967ab8f87bf3e7915e7168abead5c7004ac7
3
+ size 4831839808
model-00038-of-00117.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02cc26fb2c65c4b75f54768682527df9c74b5381e6265370d3eb131ee02bcc18
3
+ size 4781754608
model-00039-of-00117.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4cbecf08d21981d722f39679f66e7e8c3feaeec6b3bda3eb32cd08ed981e088f
3
+ size 4831839808
model-00040-of-00117.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b48ac25c6be5f7dfc2eaa8beda016f89533ea1acd585935303268fd6bf184ad5
3
+ size 4781754608
model-00041-of-00117.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:36ae76284fd788bf98c43a432ba1966db37850371411abff57adc23d58398135
3
+ size 4831839808
model-00042-of-00117.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c5832f523a3c1560ae7d6681a41847647c13ed7636110faaa9dbb268194d243
3
+ size 4781754608
model-00043-of-00117.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:03924b0a0c80b7f536f2bb18a734afff74d55181edcdf858fc8441fab11d4319
3
+ size 4831839808
model-00044-of-00117.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1060b553bb346b9435012441f213a57c9e3f1c405d0ecff45f623cb270a566c7
3
+ size 4781754608
model-00045-of-00117.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0bd18421da6e09c9c49493888ebad34ea7fd62cdc25067a4e5bbd4ab89f7eca9
3
+ size 4831839808
model-00046-of-00117.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e571cbeda4d7d3874da257e24accbf984e8428c1d44a38271ae7a9f962d4b5f
3
+ size 4982884256
model-00047-of-00117.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7343d02ed90f31e2c88b74d711426e13d7bdb3fd42cbebd40e646240c4ff2d94
3
+ size 4630710168