Upload folder using huggingface_hub

by awni - opened May 29

base: refs/heads/main

←

from: refs/pr/1

Discussion Files changed

+1538

-4945

Files changed (21) hide show

README.md +7 -3
config.json +1 -55
model-00001-of-00016.safetensors +3 -0
model-00002-of-00016.safetensors +3 -0
model-00003-of-00016.safetensors +3 -0
model-00004-of-00016.safetensors +3 -0
model-00005-of-00016.safetensors +3 -0
model-00006-of-00016.safetensors +3 -0
model-00007-of-00016.safetensors +3 -0
model-00008-of-00016.safetensors +3 -0
model-00009-of-00016.safetensors +3 -0
model-00010-of-00016.safetensors +3 -0
model-00011-of-00016.safetensors +3 -0
model-00012-of-00016.safetensors +3 -0
model-00013-of-00016.safetensors +3 -0
model-00014-of-00016.safetensors +3 -0
model-00015-of-00016.safetensors +3 -0
model-00016-of-00016.safetensors +3 -0
model.safetensors.index.json +0 -0
tokenizer.json +4 -4
tokenizer_config.json +14 -5

README.md CHANGED Viewed

@@ -1,15 +1,19 @@
 ---
 license: apache-2.0
 tags:
 - mlx
 ---
 # mlx-community/Mixtral-8x22B-Instruct-v0.1-4bit
-This model was converted to MLX format from [`mistralai/Mixtral-8x22B-Instruct-v0.1`](https://huggingface.co/mistralai/Mixtral-8x22B-Instruct-v0.1) using mlx-lm version **0.9.0**.
-Model added by [Prince Canuma](https://twitter.com/Prince_Canuma).
-Refer to the [original model card](https://huggingface.co/mistralai/Mixtral-8x22B-Instruct-v0.1) for more details on the model.
 ## Use with mlx
 ```bash

 ---
+language:
+- en
+- es
+- it
+- de
+- fr
 license: apache-2.0
 tags:
 - mlx
 ---
 # mlx-community/Mixtral-8x22B-Instruct-v0.1-4bit
+The model [mlx-community/Mixtral-8x22B-Instruct-v0.1-4bit](https://huggingface.co/mlx-community/Mixtral-8x22B-Instruct-v0.1-4bit) was converted to MLX format from [mistralai/Mixtral-8x22B-Instruct-v0.1](https://huggingface.co/mistralai/Mixtral-8x22B-Instruct-v0.1) using mlx-lm version **0.14.0**.
 ## Use with mlx
 ```bash

config.json CHANGED Viewed

@@ -1,87 +1,33 @@
 {
-    "add_cross_attention": false,
     "architectures": [
         "MixtralForCausalLM"
     ],
     "attention_dropout": 0.0,
-    "bad_words_ids": null,
-    "begin_suppress_tokens": null,
     "bos_token_id": 1,
-    "chunk_size_feed_forward": 0,
-    "cross_attention_hidden_size": null,
-    "decoder_start_token_id": null,
-    "diversity_penalty": 0.0,
-    "do_sample": false,
-    "early_stopping": false,
-    "encoder_no_repeat_ngram_size": 0,
     "eos_token_id": 2,
-    "exponential_decay_length_penalty": null,
-    "finetuning_task": null,
-    "forced_bos_token_id": null,
-    "forced_eos_token_id": null,
     "hidden_act": "silu",
     "hidden_size": 6144,
-    "id2label": {
-        "0": "LABEL_0",
-        "1": "LABEL_1"
-    },
     "initializer_range": 0.02,
     "intermediate_size": 16384,
-    "is_decoder": false,
-    "is_encoder_decoder": false,
-    "label2id": {
-        "LABEL_0": 0,
-        "LABEL_1": 1
-    },
-    "length_penalty": 1.0,
-    "max_length": 20,
     "max_position_embeddings": 65536,
-    "min_length": 0,
     "model_type": "mixtral",
-    "no_repeat_ngram_size": 0,
     "num_attention_heads": 48,
-    "num_beam_groups": 1,
-    "num_beams": 1,
     "num_experts_per_tok": 2,
     "num_hidden_layers": 56,
     "num_key_value_heads": 8,
     "num_local_experts": 8,
-    "num_return_sequences": 1,
-    "output_attentions": false,
-    "output_hidden_states": false,
     "output_router_logits": false,
-    "output_scores": false,
-    "pad_token_id": null,
-    "prefix": null,
-    "problem_type": null,
-    "pruned_heads": {},
     "quantization": {
         "group_size": 64,
         "bits": 4
     },
-    "remove_invalid_values": false,
-    "repetition_penalty": 1.0,
-    "return_dict": true,
-    "return_dict_in_generate": false,
     "rms_norm_eps": 1e-05,
     "rope_theta": 1000000.0,
     "router_aux_loss_coef": 0.001,
-    "sep_token_id": null,
     "sliding_window": null,
-    "suppress_tokens": null,
-    "task_specific_params": null,
-    "temperature": 1.0,
-    "tf_legacy_loss": false,
-    "tie_encoder_decoder": false,
     "tie_word_embeddings": false,
-    "tokenizer_class": null,
-    "top_k": 50,
-    "top_p": 1.0,
     "torch_dtype": "bfloat16",
-    "torchscript": false,
-    "transformers_version": "4.39.3",
-    "typical_p": 1.0,
-    "use_bfloat16": false,
     "use_cache": true,
     "vocab_size": 32768
 }

 {
     "architectures": [
         "MixtralForCausalLM"
     ],
     "attention_dropout": 0.0,
     "bos_token_id": 1,
     "eos_token_id": 2,
     "hidden_act": "silu",
     "hidden_size": 6144,
     "initializer_range": 0.02,
     "intermediate_size": 16384,
     "max_position_embeddings": 65536,
     "model_type": "mixtral",
     "num_attention_heads": 48,
     "num_experts_per_tok": 2,
     "num_hidden_layers": 56,
     "num_key_value_heads": 8,
     "num_local_experts": 8,
     "output_router_logits": false,
     "quantization": {
         "group_size": 64,
         "bits": 4
     },
     "rms_norm_eps": 1e-05,
     "rope_theta": 1000000.0,
     "router_aux_loss_coef": 0.001,
     "sliding_window": null,
     "tie_word_embeddings": false,
     "torch_dtype": "bfloat16",
+    "transformers_version": "4.38.0",
     "use_cache": true,
     "vocab_size": 32768
 }

model-00001-of-00016.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5cb00f81c22e84f8628741581b2987b1df5ce708cff9c75c57da60b3f49e0d44
+size 5294456945

model-00002-of-00016.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:52aac1cb6c0ea90b48aa14f922acde6d554fb110dcf310b45832c38d9ea4ddb9
+size 5181235243

model-00003-of-00016.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c29ab95b851ac9b885c26204634a920823a889de187982871e0d9ce880a34af2
+size 5181235208

model-00004-of-00016.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:65ba83e478b9ca58288bf852b09c95607c777b00b873134e5a383c561384157e
+size 5131635931

model-00005-of-00016.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:87ea5e7ed82936a2db1552948c468d906bd0aa4c02ac15517d9a1d93e4c5aa85
+size 5181235326

model-00006-of-00016.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6cfc46bad182f82b317262e3edb4417a4f3223424299a6e349a495f8891ec293
+size 5181235312

model-00007-of-00016.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6a0243b82ab8e8c73574241f182c2eed79b80033fa28f7de4c9eb4d9e3ace85e
+size 5131635949

model-00008-of-00016.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b0482cd40b6483eca40ba6e46b9ad5d7e8fb936bec8caadbd5d0e8535e2a1de1
+size 5181235342

model-00009-of-00016.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:503ba074eadbed6109d6fb57813837a26611c4e83c3f25f9d9537a9a451da9c7
+size 5181235294

model-00010-of-00016.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c3f30c130dd5f537321695368c0472a7d4d61eaf621489c794ad81da7cdfbba0
+size 5131635917

model-00011-of-00016.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6b34b30c966183f302d793d269f9e3c306ba50c5e785ca8056bc09a8a4a0a862
+size 5181235346

model-00012-of-00016.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3a3f436e96b274d006048d55761cfbd036a471e517f3f2b79c49c89cf48e8f82
+size 5181235292

model-00013-of-00016.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:afa09047699ab624c75d73cefa4f03ab3e2ace25f45c5080b1380a1600ddcc94
+size 5131635939

model-00014-of-00016.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7ed1c8918e483f47bb6b9f3404875c2d4e1cd27af6706358944ab4e49849d115
+size 5181235376

model-00015-of-00016.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d34050a8e23ffb50edca240f64af73d46e532f4064c1b54b12c2ce21442f6563
+size 5181235324

model-00016-of-00016.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cef97915a74a5e172c21766b15e8ae734fdca4368b07bcd08b4455cce4f06357
+size 1472239423

model.safetensors.index.json CHANGED Viewed

The diff for this file is too large to render. See raw diff

tokenizer.json CHANGED Viewed

@@ -76,8 +76,8 @@
       "special": true
     },
     {
-      "id": 9,
-      "content": "[/TOOL_RESULTS]",
       "single_word": false,
       "lstrip": false,
       "rstrip": false,
@@ -85,8 +85,8 @@
       "special": true
     },
     {
-      "id": 32768,
-      "content": "[TOOL_RESULT]",
       "single_word": false,
       "lstrip": false,
       "rstrip": false,

       "special": true
     },
     {
+      "id": 8,
+      "content": "[TOOL_RESULTS]",
       "single_word": false,
       "lstrip": false,
       "rstrip": false,
       "special": true
     },
     {
+      "id": 9,
+      "content": "[/TOOL_RESULTS]",
       "single_word": false,
       "lstrip": false,
       "rstrip": false,

tokenizer_config.json CHANGED Viewed

@@ -66,16 +66,16 @@
       "single_word": false,
       "special": true
     },
-    "9": {
-      "content": "[/TOOL_RESULTS]",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": false,
       "special": true
     },
-    "32768": {
-      "content": "[TOOL_RESULT]",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
@@ -85,7 +85,16 @@
   },
   "additional_special_tokens": [],
   "bos_token": "<s>",
-  "chat_template": "{{bos_token}}{% for message in messages %}{% if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}{{ raise_exception('Conversation roles must alternate user/assistant/user/assistant/...') }}{% endif %}{% if message['role'] == 'user' %}{{ ' [INST] ' + message['content'] + ' [/INST]' }}{% elif message['role'] == 'assistant' %}{{ ' ' + message['content'] + ' ' + eos_token}}{% else %}{{ raise_exception('Only user and assistant roles are supported!') }}{% endif %}{% endfor %}",
   "clean_up_tokenization_spaces": false,
   "eos_token": "</s>",
   "legacy": true,

       "single_word": false,
       "special": true
     },
+    "8": {
+      "content": "[TOOL_RESULTS]",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
       "single_word": false,
       "special": true
     },
+    "9": {
+      "content": "[/TOOL_RESULTS]",
       "lstrip": false,
       "normalized": true,
       "rstrip": false,
   },
   "additional_special_tokens": [],
   "bos_token": "<s>",
+  "chat_template": [
+    {
+      "name": "default",
+      "template": "{{bos_token}}{% for message in messages %}{% if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}{{ raise_exception('Conversation roles must alternate user/assistant/user/assistant/...') }}{% endif %}{% if message['role'] == 'user' %}{{ ' [INST] ' + message['content'] + ' [/INST]' }}{% elif message['role'] == 'assistant' %}{{ ' ' + message['content'] + ' ' + eos_token}}{% else %}{{ raise_exception('Only user and assistant roles are supported!') }}{% endif %}{% endfor %}"
+    },
+    {
+      "name": "tool_use",
+      "template": "{{bos_token}}{% set user_messages = messages | selectattr('role', 'equalto', 'user') | list %}{% for message in messages %}{% if message['role'] == 'user' %}{% if message == user_messages[-1] %}{% if tools %}{{'[AVAILABLE_TOOLS]'+ tools|string + '[/AVAILABLE_TOOLS]'}}{% endif %}{{ '[INST]' + message['content'] + '[/INST]' }}{% else %}{{ '[INST]' + message['content'] + '[/INST]' }}{% endif %}{% elif message['role'] == 'assistant' %}{{ ' ' + message['content'] + ' ' + eos_token}}{% elif message['role'] == 'tool_results' %}{{'[TOOL_RESULTS]' + message['content']|string + '[/TOOL_RESULTS]'}}{% elif message['role'] == 'tool_calls' %}{{'[TOOL_CALLS]' + message['content']|string + eos_token}}{% endif %}{% endfor %}"
+    }
+  ],
   "clean_up_tokenization_spaces": false,
   "eos_token": "</s>",
   "legacy": true,