leonardlin
committed on
Upload folder using huggingface_hub
- config.json +49 -0
- generation_config.json +8 -0
- pytorch_model-00001-of-00021.bin +3 -0
- pytorch_model-00002-of-00021.bin +3 -0
- pytorch_model-00003-of-00021.bin +3 -0
- pytorch_model-00004-of-00021.bin +3 -0
- pytorch_model-00005-of-00021.bin +3 -0
- pytorch_model-00006-of-00021.bin +3 -0
- pytorch_model-00007-of-00021.bin +3 -0
- pytorch_model-00008-of-00021.bin +3 -0
- pytorch_model-00009-of-00021.bin +3 -0
- pytorch_model-00010-of-00021.bin +3 -0
- pytorch_model-00011-of-00021.bin +3 -0
- pytorch_model-00012-of-00021.bin +3 -0
- pytorch_model-00013-of-00021.bin +3 -0
- pytorch_model-00014-of-00021.bin +3 -0
- pytorch_model-00015-of-00021.bin +3 -0
- pytorch_model-00016-of-00021.bin +3 -0
- pytorch_model-00017-of-00021.bin +3 -0
- pytorch_model-00018-of-00021.bin +3 -0
- pytorch_model-00019-of-00021.bin +3 -0
- pytorch_model-00020-of-00021.bin +3 -0
- pytorch_model-00021-of-00021.bin +3 -0
- pytorch_model.bin.index.json +0 -0
- special_tokens_map.json +30 -0
- tokenizer.json +0 -0
- tokenizer.model +3 -0
- tokenizer_config.json +48 -0
config.json
ADDED
@@ -0,0 +1,49 @@
+{
+  "_name_or_path": "ai21labs/Jamba-v0.1",
+  "architectures": [
+    "JambaForCausalLM"
+  ],
+  "attention_dropout": 0.0,
+  "attn_layer_offset": 4,
+  "attn_layer_period": 8,
+  "auto_map": {
+    "AutoConfig": "ai21labs/Jamba-v0.1--configuration_jamba.JambaConfig",
+    "AutoModel": "ai21labs/Jamba-v0.1--modeling_jamba.JambaModel",
+    "AutoModelForCausalLM": "ai21labs/Jamba-v0.1--modeling_jamba.JambaForCausalLM",
+    "AutoModelForSequenceClassification": "ai21labs/Jamba-v0.1--model.JambaForSequenceClassification"
+  },
+  "bos_token_id": 1,
+  "calc_logits_for_entire_prompt": false,
+  "eos_token_id": 2,
+  "expert_layer_offset": 1,
+  "expert_layer_period": 2,
+  "hidden_act": "silu",
+  "hidden_size": 4096,
+  "initializer_range": 0.02,
+  "intermediate_size": 14336,
+  "mamba_conv_bias": true,
+  "mamba_d_conv": 4,
+  "mamba_d_state": 16,
+  "mamba_dt_rank": 256,
+  "mamba_expand": 2,
+  "mamba_inner_layernorms": true,
+  "mamba_proj_bias": false,
+  "model_type": "jamba",
+  "n_ctx": 262144,
+  "num_attention_heads": 32,
+  "num_experts": 16,
+  "num_experts_per_tok": 2,
+  "num_hidden_layers": 32,
+  "num_key_value_heads": 8,
+  "output_router_logits": false,
+  "pad_token_id": 0,
+  "rms_norm_eps": 1e-06,
+  "router_aux_loss_coef": 0.001,
+  "sliding_window": null,
+  "tie_word_embeddings": false,
+  "torch_dtype": "bfloat16",
+  "transformers_version": "4.40.0.dev0",
+  "use_cache": false,
+  "use_mamba_kernels": true,
+  "vocab_size": 65536
+}
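A minimal loading sketch for this checkpoint. The repo id of this upload is not shown on the page, so "your-namespace/jamba-upload" below is a placeholder; the auto_map above points at remote code in ai21labs/Jamba-v0.1, so trust_remote_code=True is needed on transformers builds that predate native Jamba support (it landed around 4.40).

import torch
from transformers import AutoConfig, AutoModelForCausalLM

repo_id = "your-namespace/jamba-upload"  # placeholder, not the actual repo id

config = AutoConfig.from_pretrained(repo_id, trust_remote_code=True)
print(config.model_type, config.num_hidden_layers, config.num_experts)  # jamba 32 16

model = AutoModelForCausalLM.from_pretrained(
    repo_id,
    torch_dtype=torch.bfloat16,   # matches "torch_dtype": "bfloat16" above
    trust_remote_code=True,
    device_map="auto",            # ~98 GB of bf16 shards; spread across available devices
)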
generation_config.json
ADDED
@@ -0,0 +1,8 @@
+{
+  "_from_model_config": true,
+  "bos_token_id": 1,
+  "do_sample": true,
+  "eos_token_id": 2,
+  "pad_token_id": 0,
+  "transformers_version": "4.40.0.dev0"
+}
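These values become the default generation settings (sampling is on by default). A quick check, reusing the placeholder repo id from the previous sketch:

from transformers import GenerationConfig

gen_cfg = GenerationConfig.from_pretrained("your-namespace/jamba-upload")  # placeholder repo id
print(gen_cfg.do_sample, gen_cfg.bos_token_id, gen_cfg.eos_token_id)  # True 1 2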
pytorch_model-00001-of-00021.bin
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:61117544894b526921f20bb23574bd098ebc9323d948b378ec48e594340b2522
+size 4951250886
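Each *.bin entry above is a Git LFS pointer, not the weights themselves; the shard is fetched separately, and its SHA-256 and byte size should match the pointer's "oid" and "size" fields. A small verification sketch, assuming the shard has been downloaded locally:

import hashlib, os

def verify_shard(path: str, expected_oid: str, expected_size: int) -> bool:
    # Cheap size check first, then stream the file through SHA-256.
    if os.path.getsize(path) != expected_size:
        return False
    h = hashlib.sha256()
    with open(path, "rb") as f:
        for chunk in iter(lambda: f.read(1 << 20), b""):
            h.update(chunk)
    return h.hexdigest() == expected_oid

# Values taken from the pointer above; the local path is an assumption.
ok = verify_shard(
    "pytorch_model-00001-of-00021.bin",
    "61117544894b526921f20bb23574bd098ebc9323d948b378ec48e594340b2522",
    4951250886,
)
print(ok)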
pytorch_model-00002-of-00021.bin
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6d5b85999a872c32ac676ff0c9bf3fc75c425b4f3b1beffc7188eeb58776bf10
+size 4884160124
pytorch_model-00003-of-00021.bin
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a80fac1f62308791207f2d91aafd29763a8412d34f51e912ad4100d2fc5c046b
+size 4992308496
pytorch_model-00004-of-00021.bin
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ef8192c17bfad16dd55fb6fd6cbc1535c505070756c00673da98a418b18dab9d
+size 4958602752
pytorch_model-00005-of-00021.bin
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4c00e0dfce22a7e06f0c8a3aa3511feecb2b290f02847a6ac211183b0101477a
+size 4975514704
pytorch_model-00006-of-00021.bin
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a64125f3064b25672848161fbc9a76912547457608d65b6a1804c96ea1b82f5b
+size 4884160124
pytorch_model-00007-of-00021.bin
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:07688c7108339b1a7af2007d1e3a148bf053ac09fc10021e8d2a19761c368c59
+size 4884160188
pytorch_model-00008-of-00021.bin
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5b3acf958bc63b6ef7ddd76a1d514320b0ee8e1de2b00c07a035f27602d1873e
+size 4992308808
pytorch_model-00009-of-00021.bin
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ab67d56f9f601cdf22e5eaae2975eb81779384052e4298466119a0d95d1071bd
+size 4932516474
pytorch_model-00010-of-00021.bin
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bf11a69fec0e125569ebbd4514fca69979cad5529404d4f78027e273b44e75d6
+size 4884160224
pytorch_model-00011-of-00021.bin
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d792c8a0da576758d5354cddd3633473715bf95e62f0708832d62e5ac29526bd
+size 4884160188
pytorch_model-00012-of-00021.bin
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cb762ea4287fcc80fbc658c7828172c42b1b32d11b849ba23b8f1369d259a621
+size 4884160188
pytorch_model-00013-of-00021.bin
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f53c2a11c78a39998fa22d4864b8258ab12104b53b851d25449bf49bded71296
+size 4932516474
pytorch_model-00014-of-00021.bin
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f786a6a2079803a928fe449852a1f65066b76e16440df63bf4d6e6dd7902f7b9
+size 4992308532
pytorch_model-00015-of-00021.bin
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:6655b55f311ebd89715715d0672df81f83e2732cd60ec68a2a648c48a7264167
+size 4884160188
pytorch_model-00016-of-00021.bin
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:113bda65d155000d6e8ec469bb00388cdd3f136f54084451789ac7fa1f24c1e6
+size 4884160188
pytorch_model-00017-of-00021.bin
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:64d697b3882f784632c8ec09164bbb5f6a110e55c712d6cc30a2a79fed4424f7
+size 4908272822
pytorch_model-00018-of-00021.bin
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:01ea3b6d47021a84ce4f70da51db5c1ca57a09e455bb8c801952551a6d21fdbd
+size 4908404040
pytorch_model-00019-of-00021.bin
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0fe480d2b418201551ec14c12f29826e496d567adea9e4affccfe03a64894a7a
+size 4992308496
pytorch_model-00020-of-00021.bin
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:fe93e1e8b40d9583142ce5eac58ed7e55f168b479601f2518e5238674eaa7984
+size 4884160188
pytorch_model-00021-of-00021.bin
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:272ed20632179b7664a9abbcb31800ab127c34b3d21bac9918758a9dd9dbd394
+size 4647327276
pytorch_model.bin.index.json
ADDED
The diff for this file is too large to render.
See raw diff
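The index file itself is too large to render, but sharded PyTorch checkpoints on the Hub conventionally contain a "metadata" block and a "weight_map" that maps each parameter name to the shard storing it. A small sketch assuming that standard layout and a locally downloaded copy of the file:

import json
from collections import Counter

with open("pytorch_model.bin.index.json") as f:
    index = json.load(f)

print(index["metadata"]["total_size"])             # total checkpoint size in bytes
shard_counts = Counter(index["weight_map"].values())
for shard, n_tensors in sorted(shard_counts.items()):
    print(f"{shard}: {n_tensors} tensors")         # how many tensors live in each of the 21 shards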
special_tokens_map.json
ADDED
@@ -0,0 +1,30 @@
+{
+  "bos_token": {
+    "content": "<|startoftext|>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "eos_token": {
+    "content": "<|endoftext|>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": {
+    "content": "<|pad|>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "unk_token": {
+    "content": "<|unk|>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  }
+}
tokenizer.json
ADDED
The diff for this file is too large to render.
See raw diff
tokenizer.model
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:02fd6530b8ede0eedd8e509fcab32da7b1dd04c8119f8498c787100f13112713
+size 1124742
tokenizer_config.json
ADDED
@@ -0,0 +1,48 @@
+{
+  "add_bos_token": true,
+  "add_eos_token": false,
+  "added_tokens_decoder": {
+    "0": {
+      "content": "<|pad|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "1": {
+      "content": "<|startoftext|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "2": {
+      "content": "<|endoftext|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "3": {
+      "content": "<|unk|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "bos_token": "<|startoftext|>",
+  "clean_up_tokenization_spaces": false,
+  "eos_token": "<|endoftext|>",
+  "model_max_length": 1000000000000000019884624838656,
+  "pad_token": "<|pad|>",
+  "spaces_between_special_tokens": false,
+  "tokenizer_class": "LlamaTokenizer",
+  "unk_token": "<|unk|>",
+  "use_default_system_prompt": false,
+  "chat_template": "{% if not add_generation_prompt is defined %}{% set add_generation_prompt = false %}{% endif %}{% for message in messages %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}"
+}
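The chat_template above is the ChatML format (<|im_start|>role ... <|im_end|>). A minimal sketch of rendering a prompt with it, reusing the placeholder repo id from the earlier examples:

from transformers import AutoTokenizer

tokenizer = AutoTokenizer.from_pretrained("your-namespace/jamba-upload")  # placeholder repo id
messages = [
    {"role": "system", "content": "You are a helpful assistant."},
    {"role": "user", "content": "Hello!"},
]
prompt = tokenizer.apply_chat_template(messages, tokenize=False, add_generation_prompt=True)
print(prompt)
# <|im_start|>system
# You are a helpful assistant.<|im_end|>
# <|im_start|>user
# Hello!<|im_end|>
# <|im_start|>assistant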