CharlieFRuan
committed on
Commit
•
fe0b8bb
1
Parent(s):
f8d7639
Upload folder using huggingface_hub
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +1 -0
- mlc-chat-config.json +83 -0
- ndarray-cache-b16.json +0 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_100.bin +3 -0
- params_shard_101.bin +3 -0
- params_shard_102.bin +3 -0
- params_shard_103.bin +3 -0
- params_shard_104.bin +3 -0
- params_shard_105.bin +3 -0
- params_shard_106.bin +3 -0
- params_shard_107.bin +3 -0
- params_shard_108.bin +3 -0
- params_shard_109.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_110.bin +3 -0
- params_shard_111.bin +3 -0
- params_shard_112.bin +3 -0
- params_shard_113.bin +3 -0
- params_shard_114.bin +3 -0
- params_shard_115.bin +3 -0
- params_shard_116.bin +3 -0
- params_shard_117.bin +3 -0
- params_shard_118.bin +3 -0
- params_shard_119.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_120.bin +3 -0
- params_shard_121.bin +3 -0
- params_shard_122.bin +3 -0
- params_shard_123.bin +3 -0
- params_shard_124.bin +3 -0
- params_shard_125.bin +3 -0
- params_shard_126.bin +3 -0
- params_shard_127.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_15.bin +3 -0
- params_shard_16.bin +3 -0
- params_shard_17.bin +3 -0
- params_shard_18.bin +3 -0
- params_shard_19.bin +3 -0
- params_shard_2.bin +3 -0
- params_shard_20.bin +3 -0
- params_shard_21.bin +3 -0
- params_shard_22.bin +3 -0
- params_shard_23.bin +3 -0
- params_shard_24.bin +3 -0
.gitattributes
CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
+
tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
mlc-chat-config.json
ADDED
@@ -0,0 +1,83 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version": "0.1.0",
|
3 |
+
"model_type": "gemma2",
|
4 |
+
"quantization": "q4f32_1",
|
5 |
+
"model_config": {
|
6 |
+
"hidden_size": 3584,
|
7 |
+
"intermediate_size": 14336,
|
8 |
+
"attention_bias": false,
|
9 |
+
"num_attention_heads": 16,
|
10 |
+
"num_key_value_heads": 8,
|
11 |
+
"head_dim": 256,
|
12 |
+
"num_hidden_layers": 42,
|
13 |
+
"rms_norm_eps": 1e-06,
|
14 |
+
"vocab_size": 256000,
|
15 |
+
"hidden_activation": "gelu_pytorch_tanh",
|
16 |
+
"position_embedding_base": 10000.0,
|
17 |
+
"context_window_size": 4096,
|
18 |
+
"prefill_chunk_size": 2048,
|
19 |
+
"tensor_parallel_shards": 1,
|
20 |
+
"max_batch_size": 80,
|
21 |
+
"attn_logit_softcapping": 50.0,
|
22 |
+
"final_logit_softcapping": 30.0,
|
23 |
+
"query_pre_attn_scalar": 256,
|
24 |
+
"sliding_window": 4096
|
25 |
+
},
|
26 |
+
"vocab_size": 256000,
|
27 |
+
"context_window_size": 4096,
|
28 |
+
"sliding_window_size": -1,
|
29 |
+
"prefill_chunk_size": 2048,
|
30 |
+
"attention_sink_size": -1,
|
31 |
+
"tensor_parallel_shards": 1,
|
32 |
+
"temperature": 1.0,
|
33 |
+
"presence_penalty": 0.0,
|
34 |
+
"frequency_penalty": 0.0,
|
35 |
+
"repetition_penalty": 1.0,
|
36 |
+
"top_p": 1.0,
|
37 |
+
"tokenizer_files": [
|
38 |
+
"tokenizer.model",
|
39 |
+
"tokenizer.json",
|
40 |
+
"tokenizer_config.json"
|
41 |
+
],
|
42 |
+
"tokenizer_info": {
|
43 |
+
"token_postproc_method": "byte_fallback",
|
44 |
+
"prepend_space_in_encode": false,
|
45 |
+
"strip_space_in_decode": false
|
46 |
+
},
|
47 |
+
"conv_template": {
|
48 |
+
"name": "gemma_instruction",
|
49 |
+
"system_template": "{system_message}",
|
50 |
+
"system_message": "",
|
51 |
+
"system_prefix_token_ids": [
|
52 |
+
2
|
53 |
+
],
|
54 |
+
"add_role_after_system_message": true,
|
55 |
+
"roles": {
|
56 |
+
"user": "<start_of_turn>user",
|
57 |
+
"assistant": "<start_of_turn>model"
|
58 |
+
},
|
59 |
+
"role_templates": {
|
60 |
+
"user": "{user_message}",
|
61 |
+
"assistant": "{assistant_message}",
|
62 |
+
"tool": "{tool_message}"
|
63 |
+
},
|
64 |
+
"messages": [],
|
65 |
+
"seps": [
|
66 |
+
"<end_of_turn>\n"
|
67 |
+
],
|
68 |
+
"role_content_sep": "\n",
|
69 |
+
"role_empty_sep": "\n",
|
70 |
+
"stop_str": [
|
71 |
+
"<end_of_turn>"
|
72 |
+
],
|
73 |
+
"stop_token_ids": [
|
74 |
+
1,
|
75 |
+
107
|
76 |
+
],
|
77 |
+
"function_string": "",
|
78 |
+
"use_function_calling": false
|
79 |
+
},
|
80 |
+
"pad_token_id": 0,
|
81 |
+
"bos_token_id": 2,
|
82 |
+
"eos_token_id": 1
|
83 |
+
}
|
ndarray-cache-b16.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0c4d29ba7486f30331d513a1c4de834c358153a8c1330a598e8eaa3b6d85de90
|
3 |
+
size 458752000
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:42a3e721c1e97748d45ac551301196e230bdce463f52acb66be2cc7fd3296248
|
3 |
+
size 57344000
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:77cb98bfa068d53c54cbce1f1734a96b575ffd07f6f01b55990299f08d487d42
|
3 |
+
size 25690112
|
params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4a1a7666b94720273156571ae3ac6e455e2601dd73a5de90ff42176e310f2c78
|
3 |
+
size 32119808
|
params_shard_101.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:704e609a00e03d84fecc1e959f10f952a9b0f5ebeab90e69600342b71d90f739
|
3 |
+
size 51380224
|
params_shard_102.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ebf80c20c73596302876cf689393ce1c1b11c057ee32e04e0a08f83cd36b60cd
|
3 |
+
size 32141312
|
params_shard_103.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7eb4f8a606daf12c0d24d7984ce4f3d5dd1f1bf91e4e01ece771ecc846503c89
|
3 |
+
size 25690112
|
params_shard_104.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:92d9788ed20b7376cb95aae49e3e17bf136a0ea6ee226d41bc2592fa48005570
|
3 |
+
size 31223808
|
params_shard_105.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2a6e7dca51d6b089c8d7e9a9feca374b3d0ced403f7c0076c85abfebdac42673
|
3 |
+
size 51380224
|
params_shard_106.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e4f8ce9a43659690247dea3b40b01e051907abf82b05654cf21d2e02bf8b306b
|
3 |
+
size 33510400
|
params_shard_107.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1d691104159ecf1b23329628088d05a6166354247fd436c989e2f9b4270daa88
|
3 |
+
size 51380224
|
params_shard_108.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:101dcd44db0754a9d467b90b5f44320e77e4624e25b7cdbf9ef021cb3f38db15
|
3 |
+
size 29826048
|
params_shard_109.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b11eb1e35c64963d1bb304ab39e41da661b2013b5bc1b64fd13b36d817e7ced0
|
3 |
+
size 25690112
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a9ea6fc6d57c40b89be56fefd0f562821976f3776dd4bf649de4ad707d7dc28e
|
3 |
+
size 31223808
|
params_shard_110.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:018b422643cabe2bc0f88e82a3b975c1bf2b537cee6c769d981f61902d606d2e
|
3 |
+
size 31223808
|
params_shard_111.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d280cf392451afe0aa19d2ebf2c3a8bdd62f6a0af8bc571ed0a07f78b91a5cb5
|
3 |
+
size 51380224
|
params_shard_112.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cf06d44cfc2a9c0b667f99b7a1b17777868f6bd0d21ed5c27ad83a3d7804692c
|
3 |
+
size 33510400
|
params_shard_113.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0c0e6548a7ef69114a1a5d6cc101e723a0d6573ee7177fd404a87fdc94a86134
|
3 |
+
size 51380224
|
params_shard_114.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:023c37b12f242b4404823d6a37d65301691c8ccb40e32c28fa3ad97255452aea
|
3 |
+
size 29826048
|
params_shard_115.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:41591de0dc90ffdc644df8e24cbf55b63c1f95c86a1a14ab9ed96c49b1cd44d6
|
3 |
+
size 25690112
|
params_shard_116.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7042f75ee430e8cdf6559ec73dd3e422f91231f76ad07b83a45dd892f61f626b
|
3 |
+
size 31223808
|
params_shard_117.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5076461f7492aa78f6589fecae5c33eb2dca870c2b92b8ce64c1afa35e518a66
|
3 |
+
size 51380224
|
params_shard_118.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2024cfd8327898a52b7a456e9d947cbf6a995fd494ad370c090312657aa03287
|
3 |
+
size 33510400
|
params_shard_119.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6295faeeabdcd026965a9215313e30a63b684f3745613b018286d0c8a2d1854c
|
3 |
+
size 51380224
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6ec35023927fec64909134f50de86f7ac865d70e6c6c2b693d71a25b29228c9d
|
3 |
+
size 51380224
|
params_shard_120.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f65efabc1fffce3a0d782b385a4489f105112f2d49fef99ef1e68e873948736d
|
3 |
+
size 29826048
|
params_shard_121.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:23e7af159f7c5fa957801597f6fde63ce1f5c37a28fa03545acb5b0049331db9
|
3 |
+
size 25690112
|
params_shard_122.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a76efb42ccf023f547634684b50bed9d4b6cee511e22abc8641a4952e36b70d7
|
3 |
+
size 31223808
|
params_shard_123.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:59f538fc540a6fa1e218967200528e8f1e5064ecf4eb246607d6a0687fc4c8cf
|
3 |
+
size 51380224
|
params_shard_124.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eb63802352f47c73f5609a7b8dd6e6d35de19c22abc745d91b5f83117007a97e
|
3 |
+
size 33510400
|
params_shard_125.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:98b0f6d46f057ea76cb0d9aa0324050f49c6d021d4b6edc45eecfdde2feb0b1e
|
3 |
+
size 51380224
|
params_shard_126.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a78d4ed5f9a972d78598bc3799fa2afdfc263397377a24029c27ffb8937825f4
|
3 |
+
size 29826048
|
params_shard_127.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:36ee2aca41a32c3c72d92fa59601cab1b213afa81bf07c63afdf3ecc4c3da3f7
|
3 |
+
size 31223808
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a78d60f56c2070277b3c6913ca3af506ea72f89cc2409a9ebd66078d8d8f1c45
|
3 |
+
size 33510400
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1f60323a8b986d3e65320192a335618685475eb419403df6592f3d0e3e1966d8
|
3 |
+
size 51380224
|
params_shard_15.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e83579ec062eb7c5f556f64ded0fc3421408f817a59d2b85f5c12edaec0f6272
|
3 |
+
size 29826048
|
params_shard_16.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a8bfaef6396764ad77eb80a028f27a40f3bc231a9ac7ab8480d895096bcf8279
|
3 |
+
size 25690112
|
params_shard_17.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3f5f2a31811926796bcb6de62654c84020f2a5d5980b4aa5c0733571cccbb4f4
|
3 |
+
size 31223808
|
params_shard_18.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:66428df3a1ba53aa83eb1ca242e4efcc2d31e4cf721861814ba85c980f39bd89
|
3 |
+
size 51380224
|
params_shard_19.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:66fdecdb686b85c51021fcb9a9d7589e82f5bb0941a0a516995a980fbf7ae0e9
|
3 |
+
size 33510400
|
params_shard_2.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b0a49a3b4f1d33cbb4976335d0f6eca4b193da368f536076392996f4d01b64c3
|
3 |
+
size 51380224
|
params_shard_20.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:72a87f3aca4382f672f9d4cba887f54dfb2369561396d37643dd98632bb70243
|
3 |
+
size 51380224
|
params_shard_21.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cad581472e0d6fcb26dbc7c4e9c0ebf079b9b947f267d8bf3e2a6f9c5e45bf4d
|
3 |
+
size 29826048
|
params_shard_22.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:17415c819a52c6c5c37024ca04187e406f981cc98caee10d5a9e3d610d85c9bd
|
3 |
+
size 51380224
|
params_shard_23.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ece00a59d609581ebe3c75023ab0a2662aa7a94cbd06bc733739930139883911
|
3 |
+
size 31216640
|
params_shard_24.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:38b1d7359f90de4ca07fcc27e9668413c0d6f2f28405899f83af119a5509d0a8
|
3 |
+
size 25690112
|