mlabonne committed on
Commit
deb7de6
1 Parent(s): 5d27968

Upload folder using huggingface_hub

Browse files
config.json CHANGED
@@ -37,28 +37,13 @@
37
  "num_key_value_heads": 8,
38
  "output_router_logits": false,
39
  "pad_token_id": 0,
40
- "quantization_config": {
41
- "_load_in_4bit": true,
42
- "_load_in_8bit": false,
43
- "bnb_4bit_compute_dtype": "bfloat16",
44
- "bnb_4bit_quant_storage": "bfloat16",
45
- "bnb_4bit_quant_type": "nf4",
46
- "bnb_4bit_use_double_quant": true,
47
- "llm_int8_enable_fp32_cpu_offload": false,
48
- "llm_int8_has_fp16_weight": false,
49
- "llm_int8_skip_modules": null,
50
- "llm_int8_threshold": 6.0,
51
- "load_in_4bit": true,
52
- "load_in_8bit": false,
53
- "quant_method": "bitsandbytes"
54
- },
55
  "rms_norm_eps": 1e-06,
56
  "router_aux_loss_coef": 0.001,
57
  "sliding_window": null,
58
  "tie_word_embeddings": false,
59
- "torch_dtype": "bfloat16",
60
  "transformers_version": "4.40.0.dev0",
61
- "use_cache": false,
62
  "use_mamba_kernels": true,
63
  "vocab_size": 65536
64
  }
 
37
  "num_key_value_heads": 8,
38
  "output_router_logits": false,
39
  "pad_token_id": 0,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
40
  "rms_norm_eps": 1e-06,
41
  "router_aux_loss_coef": 0.001,
42
  "sliding_window": null,
43
  "tie_word_embeddings": false,
44
+ "torch_dtype": "float16",
45
  "transformers_version": "4.40.0.dev0",
46
+ "use_cache": true,
47
  "use_mamba_kernels": true,
48
  "vocab_size": 65536
49
  }
model-00001-of-00021.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3cc0b98c601e5bb0bded88ea064c4337c5b102a1ad3fb7cd3d6d29acfdf51015
3
  size 4951761080
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bfe5507ceb548347c102850080604bcbba8d1674a7f2d7dfb37ff00ea67d5d5e
3
  size 4951761080
model-00002-of-00021.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:828ee733282f8582fa9dd04d184e60f7c0f4549188513a3f22d805b897c21562
3
  size 4884669232
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b8f575c195fcd5932dfd58475e7eff7c14aaf0626cf704613b3c6047143ad0b7
3
  size 4884669232
model-00003-of-00021.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f5a45a24e36be28c9c09247c1c94648eebcca2335eacdc5698590ab3a4f2420a
3
  size 4992556712
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fdb20936fa4210d05fb5c171b44a75b2d2941ac6dc9b484edd66e7bc1a342946
3
  size 4992556712
model-00004-of-00021.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:92523a366c5612544851a6109347a1bffcfa3df458fb5ebe306971fa44bb5ae1
3
  size 4958853128
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df9aab7ffcadbb60b99babfe2818bdc7dd481bbdf3aec8c4a3b8b9124b41c2ea
3
  size 4958853128
model-00005-of-00021.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a770caddeacb3611187589b912c7e7affcc5be2b745436b8cbc8aa5ecd8d3b26
3
  size 4975763392
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84ecf411de10628fafa6cb43d4dae135009987ea5cdfdb0563fe4aafbe9de903
3
  size 4975763392
model-00006-of-00021.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e6fff1213e72a6ae73195bf54b4ec506515601839bee848bc50c5067f248f716
3
  size 4884669224
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:534e5cd73b106845ea6d877e56ccba37ba1a40cb7473ffb1b8f65a73ed9c98af
3
  size 4884669224
model-00007-of-00021.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:14db5f306f69f281563f81b6fa33be6f0fa8add66301ef9c213fe27c490e75b4
3
  size 4884669208
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ccb1105abbbd78585ec6d24bf82c7fa5c01135e3590ab7edded2636023ac435
3
  size 4884669208
model-00008-of-00021.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6c021244b0f11333b488f48610521c986503a686e00d1059765fde1c31792c77
3
  size 4992556768
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e4e1a6dbef33a82f91e2f6a9fd679e016025c69a075e92fab509df5df266347
3
  size 4992556768
model-00009-of-00021.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2762640be26982f608f990b05410964aaf302e8bf980c445846d7de47aada8b7
3
  size 4932506760
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:60805bf67aa6358246bee45e4395bfb190be2a328fcc59150a849008f88d19c6
3
  size 4932506760
model-00010-of-00021.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9e4942b8cd55670b10c4d40994a47df6d82a32a42be0232b46f61d00cbc5ed0b
3
  size 4884669272
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:94fc40db7c2a47028ba6632264b8d13569510ea87ec146229992c32e4a547c32
3
  size 4884669272
model-00011-of-00021.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6fa5f1d047321a15f4ef227652b26edfd2ae77109791683d8ac1a8695294b11d
3
  size 4884669304
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:04e50147baaa88c7f44ca32411d0838eb80205e18e8cbb74a743d398ed9aca17
3
  size 4884669304
model-00012-of-00021.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f07939bee191a3ceff6f786174a7ab4691762c90537181a020ee2b95b36abba4
3
  size 4884669304
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:279d24b323a30c1cd08fa0bdaa1aa99eac951c7bd18a638f00d4ed0d94227812
3
  size 4884669304
model-00013-of-00021.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:63490da867e9d817bd8f01a22d3c06b0e363fe1683b15ea427c188284e6f8757
3
  size 4932506760
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:682dbd1d6f1f80980b2cc299056e20cffc881804db6586a9393225acfce48594
3
  size 4932506760
model-00014-of-00021.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c36ec3ad1f9b3fccda2a64358e94381e810b933fcbce69dfbb7369d77d5b91d8
3
  size 4992556728
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2806ba91c1a08a2b4c43faa557fda1c80eec864e4460fcb1c900cbdcaff61bab
3
  size 4992556728
model-00015-of-00021.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0abfd0863373d57c2f16868690c4d67357596fed9dfa35010c5acacd1ca73e1e
3
  size 4884669296
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0ed8e25592d21524cf7fb22f2484275b69cdef4fdd63994d5e7bccb97965a8ad
3
  size 4884669296
model-00016-of-00021.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5813ce7a330b187a25568c4a15e0827bfa219c30fdfeb02e19fdb91a5fd09a35
3
  size 4884669304
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a381e3d2aea054c5c7416ac229c1240525ea0ea540874088a6d9dc93e8e3df0
3
  size 4884669304
model-00017-of-00021.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3a64d30344848e9c5394a7d540de7ca8034e44ecc3c180f2d0acb8748852a8ba
3
  size 4908522432
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7a2193cde14711ed4df6f64a61f0ce4b968b1040147ae81d1af41a120bd24d89
3
  size 4908522432
model-00018-of-00021.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e110d54a2239c2764ec6a947ea6a82dade230193cfe4eb93f293c9f8c2be9b05
3
  size 4908653584
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:099c2368e4ec466f12d2b44eab2c83dbcc86922d5ad0d19262cae3fdd7b18c06
3
  size 4908653584
model-00019-of-00021.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:96b7a19b9172cc000d45a0509e8e8ebba06e786905b1efba2202203ed64c7c11
3
  size 4992556768
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:394d16766b6d7c3a17fb95b44066132f07d697f73cccabb47a18a43c2b9222b0
3
  size 4992556768
model-00020-of-00021.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0bf4245bcb58ecd401cea5c94df1249dcd39114f5f287e9759ebb172e9198d41
3
  size 4884669304
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4fe94bda3d94c683ac2c22d9af82788abf526e6135fdf2bd9c306369792c7cac
3
  size 4884669304
model-00021-of-00021.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:70650ab54909e09cee4372d9637878a9722e8ab44e19d0354d7fa4c6e5d62572
3
  size 4647318216
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0aef6efd14616c45368806ba061773b84d8807f33417b1e76f39cf41800b2d38
3
  size 4647318216
tokenizer_config.json CHANGED
@@ -36,7 +36,6 @@
36
  }
37
  },
38
  "bos_token": "<|startoftext|>",
39
- "chat_template": "{% if not add_generation_prompt is defined %}{% set add_generation_prompt = false %}{% endif %}{% for message in messages %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}",
40
  "clean_up_tokenization_spaces": false,
41
  "eos_token": "<|endoftext|>",
42
  "model_max_length": 1000000000000000019884624838656,
 
36
  }
37
  },
38
  "bos_token": "<|startoftext|>",
 
39
  "clean_up_tokenization_spaces": false,
40
  "eos_token": "<|endoftext|>",
41
  "model_max_length": 1000000000000000019884624838656,