Upload folder using huggingface_hub

Browse files

Files changed (9) hide show

README.md +63 -0
config.json +34 -0
mergekit_moe_config.yml +16 -0
model-00001-of-00001.safetensors +3 -0
model.safetensors.index.json +1 -0
special_tokens_map.json +24 -0
tokenizer.json +482 -0
tokenizer.model +3 -0
tokenizer_config.json +42 -0

README.md ADDED Viewed

	@@ -0,0 +1,63 @@

+---
+license: apache-2.0
+tags:
+- moe
+- frankenmoe
+- merge
+- mergekit
+- lazymergekit
+- Corianas/Microllama_Char_88k_step
+base_model:
+- Corianas/Microllama_Char_88k_step
+- Corianas/Microllama_Char_88k_step
+---
+# microchar_moe
+microchar_moe is a Mixture of Experts (MoE) made with [LazyMergekit](https://colab.research.google.com/drive/1obulZ1ROXHjYLn6PPZJwRR6GzgQogxxb?usp=sharing) from the following models (the same checkpoint is used for both experts, so it is listed twice):
+* [Corianas/Microllama_Char_88k_step](https://huggingface.co/Corianas/Microllama_Char_88k_step)
+* [Corianas/Microllama_Char_88k_step](https://huggingface.co/Corianas/Microllama_Char_88k_step)
+## 🧩 Configuration
+```yaml
+base_model: Corianas/Microllama_Char_88k_step
+gate_mode: random # one of "hidden", "cheap_embed", or "random"
+dtype: bfloat16 # output dtype (float32, float16, or bfloat16)
+## (optional)
+# experts_per_token: 2
+experts:
+  - source_model: Corianas/Microllama_Char_88k_step
+    positive_prompts:
+      - ""
+    ## (optional)
+    # negative_prompts:
+    #   - "This is a prompt expert_model_1 should not be used for"
+  - source_model: Corianas/Microllama_Char_88k_step
+    positive_prompts:
+      - ""
+```
+## 💻 Usage
+```python
+!pip install -qU transformers bitsandbytes accelerate
+from transformers import AutoTokenizer
+import transformers
+import torch
+model = "Corianas/microchar_moe"
+tokenizer = AutoTokenizer.from_pretrained(model)
+pipeline = transformers.pipeline(
+    "text-generation",
+    model=model,
+    model_kwargs={"torch_dtype": torch.float16, "load_in_4bit": True},
+)
+messages = [{"role": "user", "content": "Explain what a Mixture of Experts is in less than 100 words."}]
+prompt = pipeline.tokenizer.apply_chat_template(messages, tokenize=False, add_generation_prompt=True)
+outputs = pipeline(prompt, max_new_tokens=256, do_sample=True, temperature=0.7, top_k=50, top_p=0.95)
+print(outputs[0]["generated_text"])
+```

config.json ADDED Viewed

	@@ -0,0 +1,34 @@

+{
+  "_name_or_path": "Corianas/Microllama_Char_88k_step",
+  "architectures": [
+    "MixtralForCausalLM"
+  ],
+  "attention_bias": false,
+  "attention_dropout": 0.0,
+  "bos_token_id": 1,
+  "eos_token_id": 2,
+  "hidden_act": "silu",
+  "hidden_size": 768,
+  "initializer_range": 0.02,
+  "intermediate_size": 2048,
+  "max_position_embeddings": 2048,
+  "model_type": "mixtral",
+  "num_attention_heads": 12,
+  "num_experts_per_tok": 2,
+  "num_hidden_layers": 12,
+  "num_key_value_heads": 12,
+  "num_local_experts": 2,
+  "output_router_logits": false,
+  "pad_token_id": 0,
+  "pretraining_tp": 1,
+  "rms_norm_eps": 1e-05,
+  "rope_scaling": null,
+  "rope_theta": 10000.0,
+  "router_aux_loss_coef": 0.001,
+  "sliding_window": null,
+  "tie_word_embeddings": true,
+  "torch_dtype": "bfloat16",
+  "transformers_version": "4.39.1",
+  "use_cache": true,
+  "vocab_size": 341
+}

mergekit_moe_config.yml ADDED Viewed

	@@ -0,0 +1,16 @@

+base_model: Corianas/Microllama_Char_88k_step
+gate_mode: random # one of "hidden", "cheap_embed", or "random"
+dtype: bfloat16 # output dtype (float32, float16, or bfloat16)
+## (optional)
+# experts_per_token: 2
+experts:
+  - source_model: Corianas/Microllama_Char_88k_step
+    positive_prompts:
+      - ""
+    ## (optional)
+    # negative_prompts:
+    #   - "This is a prompt expert_model_1 should not be used for"
+  - source_model: Corianas/Microllama_Char_88k_step
+    positive_prompts:
+      - ""

model-00001-of-00001.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:681ff26ed7201c5981ae29a40350b5a0b0b211fee1d17309cbee821834e14d1f
+size 284257216

model.safetensors.index.json ADDED Viewed

	@@ -0,0 +1 @@

+ {"metadata": {"mergekit_version": "0.0.4"}, "weight_map": {"model.embed_tokens.weight": "model-00001-of-00001.safetensors", "model.norm.weight": "model-00001-of-00001.safetensors", "lm_head.weight": "model-00001-of-00001.safetensors", "model.layers.0.input_layernorm.weight": "model-00001-of-00001.safetensors", "model.layers.1.input_layernorm.weight": "model-00001-of-00001.safetensors", "model.layers.2.input_layernorm.weight": "model-00001-of-00001.safetensors", "model.layers.3.input_layernorm.weight": "model-00001-of-00001.safetensors", "model.layers.4.input_layernorm.weight": "model-00001-of-00001.safetensors", "model.layers.5.input_layernorm.weight": "model-00001-of-00001.safetensors", "model.layers.6.input_layernorm.weight": "model-00001-of-00001.safetensors", "model.layers.7.input_layernorm.weight": "model-00001-of-00001.safetensors", "model.layers.8.input_layernorm.weight": "model-00001-of-00001.safetensors", "model.layers.9.input_layernorm.weight": "model-00001-of-00001.safetensors", "model.layers.10.input_layernorm.weight": "model-00001-of-00001.safetensors", "model.layers.11.input_layernorm.weight": "model-00001-of-00001.safetensors", "model.layers.0.block_sparse_moe.experts.0.w3.weight": "model-00001-of-00001.safetensors", "model.layers.0.block_sparse_moe.experts.1.w3.weight": "model-00001-of-00001.safetensors", "model.layers.1.block_sparse_moe.experts.0.w3.weight": "model-00001-of-00001.safetensors", "model.layers.1.block_sparse_moe.experts.1.w3.weight": "model-00001-of-00001.safetensors", "model.layers.2.block_sparse_moe.experts.0.w3.weight": "model-00001-of-00001.safetensors", "model.layers.2.block_sparse_moe.experts.1.w3.weight": "model-00001-of-00001.safetensors", "model.layers.3.block_sparse_moe.experts.0.w3.weight": "model-00001-of-00001.safetensors", "model.layers.3.block_sparse_moe.experts.1.w3.weight": "model-00001-of-00001.safetensors", "model.layers.4.block_sparse_moe.experts.0.w3.weight": "model-00001-of-00001.safetensors", 
"model.layers.4.block_sparse_moe.experts.1.w3.weight": "model-00001-of-00001.safetensors", "model.layers.5.block_sparse_moe.experts.0.w3.weight": "model-00001-of-00001.safetensors", "model.layers.5.block_sparse_moe.experts.1.w3.weight": "model-00001-of-00001.safetensors", "model.layers.6.block_sparse_moe.experts.0.w3.weight": "model-00001-of-00001.safetensors", "model.layers.6.block_sparse_moe.experts.1.w3.weight": "model-00001-of-00001.safetensors", "model.layers.7.block_sparse_moe.experts.0.w3.weight": "model-00001-of-00001.safetensors", "model.layers.7.block_sparse_moe.experts.1.w3.weight": "model-00001-of-00001.safetensors", "model.layers.8.block_sparse_moe.experts.0.w3.weight": "model-00001-of-00001.safetensors", "model.layers.8.block_sparse_moe.experts.1.w3.weight": "model-00001-of-00001.safetensors", "model.layers.9.block_sparse_moe.experts.0.w3.weight": "model-00001-of-00001.safetensors", "model.layers.9.block_sparse_moe.experts.1.w3.weight": "model-00001-of-00001.safetensors", "model.layers.10.block_sparse_moe.experts.0.w3.weight": "model-00001-of-00001.safetensors", "model.layers.10.block_sparse_moe.experts.1.w3.weight": "model-00001-of-00001.safetensors", "model.layers.11.block_sparse_moe.experts.0.w3.weight": "model-00001-of-00001.safetensors", "model.layers.11.block_sparse_moe.experts.1.w3.weight": "model-00001-of-00001.safetensors", "model.layers.0.block_sparse_moe.experts.0.w2.weight": "model-00001-of-00001.safetensors", "model.layers.0.block_sparse_moe.experts.1.w2.weight": "model-00001-of-00001.safetensors", "model.layers.1.block_sparse_moe.experts.0.w2.weight": "model-00001-of-00001.safetensors", "model.layers.1.block_sparse_moe.experts.1.w2.weight": "model-00001-of-00001.safetensors", "model.layers.2.block_sparse_moe.experts.0.w2.weight": "model-00001-of-00001.safetensors", "model.layers.2.block_sparse_moe.experts.1.w2.weight": "model-00001-of-00001.safetensors", "model.layers.3.block_sparse_moe.experts.0.w2.weight": 
"model-00001-of-00001.safetensors", "model.layers.3.block_sparse_moe.experts.1.w2.weight": "model-00001-of-00001.safetensors", "model.layers.4.block_sparse_moe.experts.0.w2.weight": "model-00001-of-00001.safetensors", "model.layers.4.block_sparse_moe.experts.1.w2.weight": "model-00001-of-00001.safetensors", "model.layers.5.block_sparse_moe.experts.0.w2.weight": "model-00001-of-00001.safetensors", "model.layers.5.block_sparse_moe.experts.1.w2.weight": "model-00001-of-00001.safetensors", "model.layers.6.block_sparse_moe.experts.0.w2.weight": "model-00001-of-00001.safetensors", "model.layers.6.block_sparse_moe.experts.1.w2.weight": "model-00001-of-00001.safetensors", "model.layers.7.block_sparse_moe.experts.0.w2.weight": "model-00001-of-00001.safetensors", "model.layers.7.block_sparse_moe.experts.1.w2.weight": "model-00001-of-00001.safetensors", "model.layers.8.block_sparse_moe.experts.0.w2.weight": "model-00001-of-00001.safetensors", "model.layers.8.block_sparse_moe.experts.1.w2.weight": "model-00001-of-00001.safetensors", "model.layers.9.block_sparse_moe.experts.0.w2.weight": "model-00001-of-00001.safetensors", "model.layers.9.block_sparse_moe.experts.1.w2.weight": "model-00001-of-00001.safetensors", "model.layers.10.block_sparse_moe.experts.0.w2.weight": "model-00001-of-00001.safetensors", "model.layers.10.block_sparse_moe.experts.1.w2.weight": "model-00001-of-00001.safetensors", "model.layers.11.block_sparse_moe.experts.0.w2.weight": "model-00001-of-00001.safetensors", "model.layers.11.block_sparse_moe.experts.1.w2.weight": "model-00001-of-00001.safetensors", "model.layers.0.block_sparse_moe.experts.0.w1.weight": "model-00001-of-00001.safetensors", "model.layers.0.block_sparse_moe.experts.1.w1.weight": "model-00001-of-00001.safetensors", "model.layers.1.block_sparse_moe.experts.0.w1.weight": "model-00001-of-00001.safetensors", "model.layers.1.block_sparse_moe.experts.1.w1.weight": "model-00001-of-00001.safetensors", 
"model.layers.2.block_sparse_moe.experts.0.w1.weight": "model-00001-of-00001.safetensors", "model.layers.2.block_sparse_moe.experts.1.w1.weight": "model-00001-of-00001.safetensors", "model.layers.3.block_sparse_moe.experts.0.w1.weight": "model-00001-of-00001.safetensors", "model.layers.3.block_sparse_moe.experts.1.w1.weight": "model-00001-of-00001.safetensors", "model.layers.4.block_sparse_moe.experts.0.w1.weight": "model-00001-of-00001.safetensors", "model.layers.4.block_sparse_moe.experts.1.w1.weight": "model-00001-of-00001.safetensors", "model.layers.5.block_sparse_moe.experts.0.w1.weight": "model-00001-of-00001.safetensors", "model.layers.5.block_sparse_moe.experts.1.w1.weight": "model-00001-of-00001.safetensors", "model.layers.6.block_sparse_moe.experts.0.w1.weight": "model-00001-of-00001.safetensors", "model.layers.6.block_sparse_moe.experts.1.w1.weight": "model-00001-of-00001.safetensors", "model.layers.7.block_sparse_moe.experts.0.w1.weight": "model-00001-of-00001.safetensors", "model.layers.7.block_sparse_moe.experts.1.w1.weight": "model-00001-of-00001.safetensors", "model.layers.8.block_sparse_moe.experts.0.w1.weight": "model-00001-of-00001.safetensors", "model.layers.8.block_sparse_moe.experts.1.w1.weight": "model-00001-of-00001.safetensors", "model.layers.9.block_sparse_moe.experts.0.w1.weight": "model-00001-of-00001.safetensors", "model.layers.9.block_sparse_moe.experts.1.w1.weight": "model-00001-of-00001.safetensors", "model.layers.10.block_sparse_moe.experts.0.w1.weight": "model-00001-of-00001.safetensors", "model.layers.10.block_sparse_moe.experts.1.w1.weight": "model-00001-of-00001.safetensors", "model.layers.11.block_sparse_moe.experts.0.w1.weight": "model-00001-of-00001.safetensors", "model.layers.11.block_sparse_moe.experts.1.w1.weight": "model-00001-of-00001.safetensors", "model.layers.0.post_attention_layernorm.weight": "model-00001-of-00001.safetensors", "model.layers.1.post_attention_layernorm.weight": "model-00001-of-00001.safetensors", 
"model.layers.2.post_attention_layernorm.weight": "model-00001-of-00001.safetensors", "model.layers.3.post_attention_layernorm.weight": "model-00001-of-00001.safetensors", "model.layers.4.post_attention_layernorm.weight": "model-00001-of-00001.safetensors", "model.layers.5.post_attention_layernorm.weight": "model-00001-of-00001.safetensors", "model.layers.6.post_attention_layernorm.weight": "model-00001-of-00001.safetensors", "model.layers.7.post_attention_layernorm.weight": "model-00001-of-00001.safetensors", "model.layers.8.post_attention_layernorm.weight": "model-00001-of-00001.safetensors", "model.layers.9.post_attention_layernorm.weight": "model-00001-of-00001.safetensors", "model.layers.10.post_attention_layernorm.weight": "model-00001-of-00001.safetensors", "model.layers.11.post_attention_layernorm.weight": "model-00001-of-00001.safetensors", "model.layers.0.self_attn.q_proj.weight": "model-00001-of-00001.safetensors", "model.layers.1.self_attn.q_proj.weight": "model-00001-of-00001.safetensors", "model.layers.2.self_attn.q_proj.weight": "model-00001-of-00001.safetensors", "model.layers.3.self_attn.q_proj.weight": "model-00001-of-00001.safetensors", "model.layers.4.self_attn.q_proj.weight": "model-00001-of-00001.safetensors", "model.layers.5.self_attn.q_proj.weight": "model-00001-of-00001.safetensors", "model.layers.6.self_attn.q_proj.weight": "model-00001-of-00001.safetensors", "model.layers.7.self_attn.q_proj.weight": "model-00001-of-00001.safetensors", "model.layers.8.self_attn.q_proj.weight": "model-00001-of-00001.safetensors", "model.layers.9.self_attn.q_proj.weight": "model-00001-of-00001.safetensors", "model.layers.10.self_attn.q_proj.weight": "model-00001-of-00001.safetensors", "model.layers.11.self_attn.q_proj.weight": "model-00001-of-00001.safetensors", "model.layers.0.self_attn.k_proj.weight": "model-00001-of-00001.safetensors", "model.layers.1.self_attn.k_proj.weight": "model-00001-of-00001.safetensors", "model.layers.2.self_attn.k_proj.weight": 
"model-00001-of-00001.safetensors", "model.layers.3.self_attn.k_proj.weight": "model-00001-of-00001.safetensors", "model.layers.4.self_attn.k_proj.weight": "model-00001-of-00001.safetensors", "model.layers.5.self_attn.k_proj.weight": "model-00001-of-00001.safetensors", "model.layers.6.self_attn.k_proj.weight": "model-00001-of-00001.safetensors", "model.layers.7.self_attn.k_proj.weight": "model-00001-of-00001.safetensors", "model.layers.8.self_attn.k_proj.weight": "model-00001-of-00001.safetensors", "model.layers.9.self_attn.k_proj.weight": "model-00001-of-00001.safetensors", "model.layers.10.self_attn.k_proj.weight": "model-00001-of-00001.safetensors", "model.layers.11.self_attn.k_proj.weight": "model-00001-of-00001.safetensors", "model.layers.0.self_attn.v_proj.weight": "model-00001-of-00001.safetensors", "model.layers.1.self_attn.v_proj.weight": "model-00001-of-00001.safetensors", "model.layers.2.self_attn.v_proj.weight": "model-00001-of-00001.safetensors", "model.layers.3.self_attn.v_proj.weight": "model-00001-of-00001.safetensors", "model.layers.4.self_attn.v_proj.weight": "model-00001-of-00001.safetensors", "model.layers.5.self_attn.v_proj.weight": "model-00001-of-00001.safetensors", "model.layers.6.self_attn.v_proj.weight": "model-00001-of-00001.safetensors", "model.layers.7.self_attn.v_proj.weight": "model-00001-of-00001.safetensors", "model.layers.8.self_attn.v_proj.weight": "model-00001-of-00001.safetensors", "model.layers.9.self_attn.v_proj.weight": "model-00001-of-00001.safetensors", "model.layers.10.self_attn.v_proj.weight": "model-00001-of-00001.safetensors", "model.layers.11.self_attn.v_proj.weight": "model-00001-of-00001.safetensors", "model.layers.0.self_attn.o_proj.weight": "model-00001-of-00001.safetensors", "model.layers.1.self_attn.o_proj.weight": "model-00001-of-00001.safetensors", "model.layers.2.self_attn.o_proj.weight": "model-00001-of-00001.safetensors", "model.layers.3.self_attn.o_proj.weight": "model-00001-of-00001.safetensors", 
"model.layers.4.self_attn.o_proj.weight": "model-00001-of-00001.safetensors", "model.layers.5.self_attn.o_proj.weight": "model-00001-of-00001.safetensors", "model.layers.6.self_attn.o_proj.weight": "model-00001-of-00001.safetensors", "model.layers.7.self_attn.o_proj.weight": "model-00001-of-00001.safetensors", "model.layers.8.self_attn.o_proj.weight": "model-00001-of-00001.safetensors", "model.layers.9.self_attn.o_proj.weight": "model-00001-of-00001.safetensors", "model.layers.10.self_attn.o_proj.weight": "model-00001-of-00001.safetensors", "model.layers.11.self_attn.o_proj.weight": "model-00001-of-00001.safetensors", "model.layers.0.block_sparse_moe.gate.weight": "model-00001-of-00001.safetensors", "model.layers.1.block_sparse_moe.gate.weight": "model-00001-of-00001.safetensors", "model.layers.2.block_sparse_moe.gate.weight": "model-00001-of-00001.safetensors", "model.layers.3.block_sparse_moe.gate.weight": "model-00001-of-00001.safetensors", "model.layers.4.block_sparse_moe.gate.weight": "model-00001-of-00001.safetensors", "model.layers.5.block_sparse_moe.gate.weight": "model-00001-of-00001.safetensors", "model.layers.6.block_sparse_moe.gate.weight": "model-00001-of-00001.safetensors", "model.layers.7.block_sparse_moe.gate.weight": "model-00001-of-00001.safetensors", "model.layers.8.block_sparse_moe.gate.weight": "model-00001-of-00001.safetensors", "model.layers.9.block_sparse_moe.gate.weight": "model-00001-of-00001.safetensors", "model.layers.10.block_sparse_moe.gate.weight": "model-00001-of-00001.safetensors", "model.layers.11.block_sparse_moe.gate.weight": "model-00001-of-00001.safetensors"}}

special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,24 @@

+{
+  "bos_token": {
+    "content": "<s>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "eos_token": {
+    "content": "</s>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": "<s>",
+  "unk_token": {
+    "content": "<unk>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  }
+}

tokenizer.json ADDED Viewed

	@@ -0,0 +1,482 @@

+{
+  "version": "1.0",
+  "truncation": null,
+  "padding": null,
+  "added_tokens": [
+    {
+      "id": 0,
+      "content": "<unk>",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 1,
+      "content": "<s>",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 2,
+      "content": "</s>",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    }
+  ],
+  "normalizer": {
+    "type": "Sequence",
+    "normalizers": [
+      {
+        "type": "Prepend",
+        "prepend": "▁"
+      },
+      {
+        "type": "Replace",
+        "pattern": {
+          "String": " "
+        },
+        "content": "▁"
+      }
+    ]
+  },
+  "pre_tokenizer": null,
+  "post_processor": {
+    "type": "TemplateProcessing",
+    "single": [
+      {
+        "SpecialToken": {
+          "id": "<s>",
+          "type_id": 0
+        }
+      },
+      {
+        "Sequence": {
+          "id": "A",
+          "type_id": 0
+        }
+      }
+    ],
+    "pair": [
+      {
+        "SpecialToken": {
+          "id": "<s>",
+          "type_id": 0
+        }
+      },
+      {
+        "Sequence": {
+          "id": "A",
+          "type_id": 0
+        }
+      },
+      {
+        "SpecialToken": {
+          "id": "<s>",
+          "type_id": 1
+        }
+      },
+      {
+        "Sequence": {
+          "id": "B",
+          "type_id": 1
+        }
+      }
+    ],
+    "special_tokens": {
+      "<s>": {
+        "id": "<s>",
+        "ids": [
+          1
+        ],
+        "tokens": [
+          "<s>"
+        ]
+      }
+    }
+  },
+  "decoder": {
+    "type": "Sequence",
+    "decoders": [
+      {
+        "type": "Replace",
+        "pattern": {
+          "String": "▁"
+        },
+        "content": " "
+      },
+      {
+        "type": "ByteFallback"
+      },
+      {
+        "type": "Fuse"
+      },
+      {
+        "type": "Strip",
+        "content": " ",
+        "start": 1,
+        "stop": 0
+      }
+    ]
+  },
+  "model": {
+    "type": "BPE",
+    "dropout": null,
+    "unk_token": "<unk>",
+    "continuing_subword_prefix": null,
+    "end_of_word_suffix": null,
+    "fuse_unk": true,
+    "byte_fallback": true,
+    "vocab": {
+      "<unk>": 0,
+      "<s>": 1,
+      "</s>": 2,
+      "<0x00>": 3,
+      "<0x01>": 4,
+      "<0x02>": 5,
+      "<0x03>": 6,
+      "<0x04>": 7,
+      "<0x05>": 8,
+      "<0x06>": 9,
+      "<0x07>": 10,
+      "<0x08>": 11,
+      "<0x09>": 12,
+      "<0x0A>": 13,
+      "<0x0B>": 14,
+      "<0x0C>": 15,
+      "<0x0D>": 16,
+      "<0x0E>": 17,
+      "<0x0F>": 18,
+      "<0x10>": 19,
+      "<0x11>": 20,
+      "<0x12>": 21,
+      "<0x13>": 22,
+      "<0x14>": 23,
+      "<0x15>": 24,
+      "<0x16>": 25,
+      "<0x17>": 26,
+      "<0x18>": 27,
+      "<0x19>": 28,
+      "<0x1A>": 29,
+      "<0x1B>": 30,
+      "<0x1C>": 31,
+      "<0x1D>": 32,
+      "<0x1E>": 33,
+      "<0x1F>": 34,
+      "<0x20>": 35,
+      "<0x21>": 36,
+      "<0x22>": 37,
+      "<0x23>": 38,
+      "<0x24>": 39,
+      "<0x25>": 40,
+      "<0x26>": 41,
+      "<0x27>": 42,
+      "<0x28>": 43,
+      "<0x29>": 44,
+      "<0x2A>": 45,
+      "<0x2B>": 46,
+      "<0x2C>": 47,
+      "<0x2D>": 48,
+      "<0x2E>": 49,
+      "<0x2F>": 50,
+      "<0x30>": 51,
+      "<0x31>": 52,
+      "<0x32>": 53,
+      "<0x33>": 54,
+      "<0x34>": 55,
+      "<0x35>": 56,
+      "<0x36>": 57,
+      "<0x37>": 58,
+      "<0x38>": 59,
+      "<0x39>": 60,
+      "<0x3A>": 61,
+      "<0x3B>": 62,
+      "<0x3C>": 63,
+      "<0x3D>": 64,
+      "<0x3E>": 65,
+      "<0x3F>": 66,
+      "<0x40>": 67,
+      "<0x41>": 68,
+      "<0x42>": 69,
+      "<0x43>": 70,
+      "<0x44>": 71,
+      "<0x45>": 72,
+      "<0x46>": 73,
+      "<0x47>": 74,
+      "<0x48>": 75,
+      "<0x49>": 76,
+      "<0x4A>": 77,
+      "<0x4B>": 78,
+      "<0x4C>": 79,
+      "<0x4D>": 80,
+      "<0x4E>": 81,
+      "<0x4F>": 82,
+      "<0x50>": 83,
+      "<0x51>": 84,
+      "<0x52>": 85,
+      "<0x53>": 86,
+      "<0x54>": 87,
+      "<0x55>": 88,
+      "<0x56>": 89,
+      "<0x57>": 90,
+      "<0x58>": 91,
+      "<0x59>": 92,
+      "<0x5A>": 93,
+      "<0x5B>": 94,
+      "<0x5C>": 95,
+      "<0x5D>": 96,
+      "<0x5E>": 97,
+      "<0x5F>": 98,
+      "<0x60>": 99,
+      "<0x61>": 100,
+      "<0x62>": 101,
+      "<0x63>": 102,
+      "<0x64>": 103,
+      "<0x65>": 104,
+      "<0x66>": 105,
+      "<0x67>": 106,
+      "<0x68>": 107,
+      "<0x69>": 108,
+      "<0x6A>": 109,
+      "<0x6B>": 110,
+      "<0x6C>": 111,
+      "<0x6D>": 112,
+      "<0x6E>": 113,
+      "<0x6F>": 114,
+      "<0x70>": 115,
+      "<0x71>": 116,
+      "<0x72>": 117,
+      "<0x73>": 118,
+      "<0x74>": 119,
+      "<0x75>": 120,
+      "<0x76>": 121,
+      "<0x77>": 122,
+      "<0x78>": 123,
+      "<0x79>": 124,
+      "<0x7A>": 125,
+      "<0x7B>": 126,
+      "<0x7C>": 127,
+      "<0x7D>": 128,
+      "<0x7E>": 129,
+      "<0x7F>": 130,
+      "<0x80>": 131,
+      "<0x81>": 132,
+      "<0x82>": 133,
+      "<0x83>": 134,
+      "<0x84>": 135,
+      "<0x85>": 136,
+      "<0x86>": 137,
+      "<0x87>": 138,
+      "<0x88>": 139,
+      "<0x89>": 140,
+      "<0x8A>": 141,
+      "<0x8B>": 142,
+      "<0x8C>": 143,
+      "<0x8D>": 144,
+      "<0x8E>": 145,
+      "<0x8F>": 146,
+      "<0x90>": 147,
+      "<0x91>": 148,
+      "<0x92>": 149,
+      "<0x93>": 150,
+      "<0x94>": 151,
+      "<0x95>": 152,
+      "<0x96>": 153,
+      "<0x97>": 154,
+      "<0x98>": 155,
+      "<0x99>": 156,
+      "<0x9A>": 157,
+      "<0x9B>": 158,
+      "<0x9C>": 159,
+      "<0x9D>": 160,
+      "<0x9E>": 161,
+      "<0x9F>": 162,
+      "<0xA0>": 163,
+      "<0xA1>": 164,
+      "<0xA2>": 165,
+      "<0xA3>": 166,
+      "<0xA4>": 167,
+      "<0xA5>": 168,
+      "<0xA6>": 169,
+      "<0xA7>": 170,
+      "<0xA8>": 171,
+      "<0xA9>": 172,
+      "<0xAA>": 173,
+      "<0xAB>": 174,
+      "<0xAC>": 175,
+      "<0xAD>": 176,
+      "<0xAE>": 177,
+      "<0xAF>": 178,
+      "<0xB0>": 179,
+      "<0xB1>": 180,
+      "<0xB2>": 181,
+      "<0xB3>": 182,
+      "<0xB4>": 183,
+      "<0xB5>": 184,
+      "<0xB6>": 185,
+      "<0xB7>": 186,
+      "<0xB8>": 187,
+      "<0xB9>": 188,
+      "<0xBA>": 189,
+      "<0xBB>": 190,
+      "<0xBC>": 191,
+      "<0xBD>": 192,
+      "<0xBE>": 193,
+      "<0xBF>": 194,
+      "<0xC0>": 195,
+      "<0xC1>": 196,
+      "<0xC2>": 197,
+      "<0xC3>": 198,
+      "<0xC4>": 199,
+      "<0xC5>": 200,
+      "<0xC6>": 201,
+      "<0xC7>": 202,
+      "<0xC8>": 203,
+      "<0xC9>": 204,
+      "<0xCA>": 205,
+      "<0xCB>": 206,
+      "<0xCC>": 207,
+      "<0xCD>": 208,
+      "<0xCE>": 209,
+      "<0xCF>": 210,
+      "<0xD0>": 211,
+      "<0xD1>": 212,
+      "<0xD2>": 213,
+      "<0xD3>": 214,
+      "<0xD4>": 215,
+      "<0xD5>": 216,
+      "<0xD6>": 217,
+      "<0xD7>": 218,
+      "<0xD8>": 219,
+      "<0xD9>": 220,
+      "<0xDA>": 221,
+      "<0xDB>": 222,
+      "<0xDC>": 223,
+      "<0xDD>": 224,
+      "<0xDE>": 225,
+      "<0xDF>": 226,
+      "<0xE0>": 227,
+      "<0xE1>": 228,
+      "<0xE2>": 229,
+      "<0xE3>": 230,
+      "<0xE4>": 231,
+      "<0xE5>": 232,
+      "<0xE6>": 233,
+      "<0xE7>": 234,
+      "<0xE8>": 235,
+      "<0xE9>": 236,
+      "<0xEA>": 237,
+      "<0xEB>": 238,
+      "<0xEC>": 239,
+      "<0xED>": 240,
+      "<0xEE>": 241,
+      "<0xEF>": 242,
+      "<0xF0>": 243,
+      "<0xF1>": 244,
+      "<0xF2>": 245,
+      "<0xF3>": 246,
+      "<0xF4>": 247,
+      "<0xF5>": 248,
+      "<0xF6>": 249,
+      "<0xF7>": 250,
+      "<0xF8>": 251,
+      "<0xF9>": 252,
+      "<0xFA>": 253,
+      "<0xFB>": 254,
+      "<0xFC>": 255,
+      "<0xFD>": 256,
+      "<0xFE>": 257,
+      "<0xFF>": 258,
+      "▁": 259,
+      "e": 260,
+      "t": 261,
+      "a": 262,
+      "o": 263,
+      "h": 264,
+      "n": 265,
+      "s": 266,
+      "i": 267,
+      "r": 268,
+      "d": 269,
+      "l": 270,
+      "u": 271,
+      "w": 272,
+      "m": 273,
+      "↨": 274,
+      "g": 275,
+      "c": 276,
+      "f": 277,
+      "y": 278,
+      ".": 279,
+      "p": 280,
+      ",": 281,
+      "b": 282,
+      "\r": 283,
+      "k": 284,
+      "v": 285,
+      "\"": 286,
+      "'": 287,
+      "j": 288,
+      "x": 289,
+      "z": 290,
+      "q": 291,
+      "§": 292,
+      "?": 293,
+      "-": 294,
+      "!": 295,
+      ":": 296,
+      "1": 297,
+      "0": 298,
+      "2": 299,
+      "5": 300,
+      "3": 301,
+      ";": 302,
+      "4": 303,
+      "9": 304,
+      "8": 305,
+      "$": 306,
+      "6": 307,
+      "7": 308,
+      "+": 309,
+      "=": 310,
+      ")": 311,
+      "(": 312,
+      "&": 313,
+      "/": 314,
+      "%": 315,
+      "^": 316,
+      "*": 317,
+      "`": 318,
+      "_": 319,
+      "]": 320,
+      "<": 321,
+      "[": 322,
+      "\\": 323,
+      ">": 324,
+      "{": 325,
+      "}": 326,
+      "|": 327,
+      "¼": 328,
+      "½": 329,
+      "π": 330,
+      "←": 331,
+      "↑": 332,
+      "→": 333,
+      "↓": 334,
+      "▲": 335,
+      "►": 336,
+      "▼": 337,
+      "◄": 338,
+      "♪": 339,
+      "♫": 340
+    },
+    "merges": []
+  }
+}

tokenizer.model ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8a9ecce7fdafd04b12010f1b0b21feb89a2c0495b6ff899fac1ba9a285f4abc5
+size 5543

tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,42 @@

+{
+  "add_bos_token": true,
+  "add_eos_token": false,
+  "add_prefix_space": true,
+  "added_tokens_decoder": {
+    "0": {
+      "content": "<unk>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "1": {
+      "content": "<s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "2": {
+      "content": "</s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "bos_token": "<s>",
+  "clean_up_tokenization_spaces": false,
+  "eos_token": "</s>",
+  "legacy": true,
+  "model_max_length": 1000000000000000019884624838656,
+  "pad_token": "<s>",
+  "sp_model_kwargs": {},
+  "spaces_between_special_tokens": false,
+  "tokenizer_class": "LlamaTokenizer",
+  "unk_token": "<unk>",
+  "use_default_system_prompt": false
+}