CharlieFRuan
committed on
Commit
•
91b7588
1
Parent(s):
05c4985
Initial commit
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- logs.txt +0 -0
- mlc-chat-config.json +75 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_100.bin +3 -0
- params_shard_101.bin +3 -0
- params_shard_102.bin +3 -0
- params_shard_103.bin +3 -0
- params_shard_104.bin +3 -0
- params_shard_105.bin +3 -0
- params_shard_106.bin +3 -0
- params_shard_107.bin +3 -0
- params_shard_108.bin +3 -0
- params_shard_109.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_110.bin +3 -0
- params_shard_111.bin +3 -0
- params_shard_112.bin +3 -0
- params_shard_113.bin +3 -0
- params_shard_114.bin +3 -0
- params_shard_115.bin +3 -0
- params_shard_116.bin +3 -0
- params_shard_117.bin +3 -0
- params_shard_118.bin +3 -0
- params_shard_119.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_120.bin +3 -0
- params_shard_121.bin +3 -0
- params_shard_122.bin +3 -0
- params_shard_123.bin +3 -0
- params_shard_124.bin +3 -0
- params_shard_125.bin +3 -0
- params_shard_126.bin +3 -0
- params_shard_127.bin +3 -0
- params_shard_128.bin +3 -0
- params_shard_129.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_130.bin +3 -0
- params_shard_131.bin +3 -0
- params_shard_132.bin +3 -0
- params_shard_133.bin +3 -0
- params_shard_134.bin +3 -0
- params_shard_135.bin +3 -0
- params_shard_136.bin +3 -0
- params_shard_137.bin +3 -0
- params_shard_138.bin +3 -0
- params_shard_139.bin +3 -0
- params_shard_14.bin +3 -0
logs.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
mlc-chat-config.json
ADDED
@@ -0,0 +1,75 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"model_type": "llama",
|
3 |
+
"quantization": "q3f16_1",
|
4 |
+
"model_config": {
|
5 |
+
"hidden_size": 8192,
|
6 |
+
"intermediate_size": 28672,
|
7 |
+
"num_attention_heads": 64,
|
8 |
+
"num_hidden_layers": 80,
|
9 |
+
"rms_norm_eps": 1e-05,
|
10 |
+
"vocab_size": 128256,
|
11 |
+
"position_embedding_base": 500000.0,
|
12 |
+
"context_window_size": 8192,
|
13 |
+
"prefill_chunk_size": 1024,
|
14 |
+
"num_key_value_heads": 8,
|
15 |
+
"head_dim": 128,
|
16 |
+
"tensor_parallel_shards": 1,
|
17 |
+
"max_batch_size": 80
|
18 |
+
},
|
19 |
+
"vocab_size": 128256,
|
20 |
+
"context_window_size": 8192,
|
21 |
+
"sliding_window_size": -1,
|
22 |
+
"prefill_chunk_size": 1024,
|
23 |
+
"attention_sink_size": -1,
|
24 |
+
"tensor_parallel_shards": 1,
|
25 |
+
"mean_gen_len": 128,
|
26 |
+
"max_gen_len": 512,
|
27 |
+
"shift_fill_factor": 0.3,
|
28 |
+
"temperature": 0.7,
|
29 |
+
"presence_penalty": 0.0,
|
30 |
+
"frequency_penalty": 0.0,
|
31 |
+
"repetition_penalty": 1.0,
|
32 |
+
"top_p": 0.95,
|
33 |
+
"conv_template": {
|
34 |
+
"name": "llama-3",
|
35 |
+
"system_template": "<|start_header_id|>system<|end_header_id|>\n\n{system_message}",
|
36 |
+
"system_message": "You are a helpful, respectful and honest assistant.",
|
37 |
+
"system_prefix_token_ids": [
|
38 |
+
128000
|
39 |
+
],
|
40 |
+
"add_role_after_system_message": true,
|
41 |
+
"roles": {
|
42 |
+
"user": "user",
|
43 |
+
"assistant": "assistant"
|
44 |
+
},
|
45 |
+
"role_templates": {
|
46 |
+
"user": "{user_message}",
|
47 |
+
"assistant": "{assistant_message}",
|
48 |
+
"tool": "{tool_message}"
|
49 |
+
},
|
50 |
+
"messages": [],
|
51 |
+
"seps": [
|
52 |
+
"<|eot_id|><|start_header_id|>"
|
53 |
+
],
|
54 |
+
"role_content_sep": "<|end_header_id|>\n\n",
|
55 |
+
"role_empty_sep": "<|end_header_id|>\n\n",
|
56 |
+
"stop_str": [
|
57 |
+
"<|end_of_text|>",
|
58 |
+
"<|eot_id|>"
|
59 |
+
],
|
60 |
+
"stop_token_ids": [
|
61 |
+
128001,
|
62 |
+
128009
|
63 |
+
],
|
64 |
+
"function_string": "",
|
65 |
+
"use_function_calling": false
|
66 |
+
},
|
67 |
+
"pad_token_id": 0,
|
68 |
+
"bos_token_id": 128000,
|
69 |
+
"eos_token_id": 128001,
|
70 |
+
"tokenizer_files": [
|
71 |
+
"tokenizer.json",
|
72 |
+
"tokenizer_config.json"
|
73 |
+
],
|
74 |
+
"version": "0.1.0"
|
75 |
+
}
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2d6d20e0b71a37518d4719073be0b9a77610a357bbe5957f830c433c11f9c24e
|
3 |
+
size 420679680
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:24032d8f6b607fe15cd2bd179b737c0789b1782671e860e51fe2c7cae044bd9f
|
3 |
+
size 52584960
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:77e5cf259458ca3db1cbad9bbc180bb251724aab2a366b2c5a81e9224a6efde0
|
3 |
+
size 23511040
|
params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c5e7fcfbd37aca09ee84795d1604f92e970f23e2e0d9f8f44b3fe22bf5bb2398
|
3 |
+
size 26869760
|
params_shard_101.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:78d2a40b662b35a34d036d771307c0efb198c74be6d5d83e921309a928feb500
|
3 |
+
size 31100928
|
params_shard_102.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:83240b129ee575ccea2816f332b5da695bc417f061ac8954dcb69e3ad7e22230
|
3 |
+
size 93978624
|
params_shard_103.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c16566ef3ec5e933c7ceef4d36bbd688b08acbe1d1514989c5c1c4e38917785f
|
3 |
+
size 188088320
|
params_shard_104.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c31d6d3b076796b426f84a61d4d56abfdfda5b9a4517f561b5b884e8f90feb9d
|
3 |
+
size 23511040
|
params_shard_105.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2324503dd8d324a6ef56f1bddb9968cb877678f94a967a7be8b78817ba8cd326
|
3 |
+
size 33587200
|
params_shard_106.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fceb03b3e75b0996319ebc68b99d2efcbb1a6306aa61ebb9cbbb389dafbba091
|
3 |
+
size 26869760
|
params_shard_107.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0fd021f6bb2bfd1b1b08b305bb8dac89484ae290211c1aa659e288a99e4cd4d5
|
3 |
+
size 93978624
|
params_shard_108.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:979268ab2e211ec51caf1efcf25aac6be2b68789ba03da41f93ab33cfce63d8a
|
3 |
+
size 22712320
|
params_shard_109.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a8f90a96635d303a24a763c6634edbff8901c1bcc85998afb2c97cfad3f9373d
|
3 |
+
size 188088320
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7ca2d29b7d1b48f1d7c7864f3dd43bc5d43377ef2df88b7d16bc0954c11c0406
|
3 |
+
size 33587200
|
params_shard_110.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:881fa8f0089de8aadb51d14eadbaf632a0efd0dbb0b26d2578982cbdc70e0b61
|
3 |
+
size 23511040
|
params_shard_111.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bc99a700fe9141fdc6b2ca3a62e68a7dd1cc4b20d8a0d2d9f006ee6013098baf
|
3 |
+
size 33587200
|
params_shard_112.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0ca8bb8c3dfcc12d5fb046a80630e6bb12e170bfa3d16c24890ad336a6919a50
|
3 |
+
size 26869760
|
params_shard_113.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:054c2f7a34e1bb3a2c30562927a5a52b2d16abcdba80dd8bd1f3396ff2ba94f2
|
3 |
+
size 93978624
|
params_shard_114.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:edeedf04ce0660e8fa8d56719a727237a09c268ed1d3339c7cb80ac5ce22f145
|
3 |
+
size 188088320
|
params_shard_115.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:556568ff581c16e5dfce47ec474c1de58c031399ab382df5676ccc4e6a14d42e
|
3 |
+
size 23511040
|
params_shard_116.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e23d1806463bc8be0d9d1e37541d3e024aa7072234dfa8631e1b990bc4c1e1ab
|
3 |
+
size 33587200
|
params_shard_117.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:12dd50323b7d1a67ea4c35ad6f22c817a0ebe2a78b30800495be4f164253746d
|
3 |
+
size 31100928
|
params_shard_118.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:53ea81a01d6881c017e64a96cba5754b87a945002fbb9294233336a4f9183cc0
|
3 |
+
size 31068160
|
params_shard_119.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ab16cc898b978033c35cb22dcff7f88670246c33e1aa6049f3b8eb91d27fb29d
|
3 |
+
size 188088320
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f979793a64a197193e1acea2ec25c53d99c092cd09e9f15b610954cb4c887e48
|
3 |
+
size 26869760
|
params_shard_120.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:605209f18f930aad56674cfc8c76fe13c940282be516d2983d4d1947ca7c4133
|
3 |
+
size 33587200
|
params_shard_121.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c4314be88603833c78ee45a0bec47abe4f487addee0ec763a35bcf593051de1a
|
3 |
+
size 26869760
|
params_shard_122.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9e4e9aeb64c785379827eb283aa0e55cba8cd5e86917c4b2325d2ecc8326955d
|
3 |
+
size 31068160
|
params_shard_123.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6f365f776ab96a67974c4131a38944d243baee8beb4b4e30e47975b1f83f1af8
|
3 |
+
size 93978624
|
params_shard_124.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cf353049ed569c90559712d5786b1c03b962b827c6344442c8820a10eeb3bdf9
|
3 |
+
size 93978624
|
params_shard_125.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ca081ef6446f865af9c65725964d5eec4a213dcbb4013fc30478a40742fe3919
|
3 |
+
size 188088320
|
params_shard_126.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8c8f360de5ac1b0ea51ec1beb34c6e165dce18f121c1f622a7a1ff53d644236b
|
3 |
+
size 23511040
|
params_shard_127.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:721c6de84fb0c40899d6205356b60f28f71c76615b06d91e6042a3243b37e750
|
3 |
+
size 33587200
|
params_shard_128.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:668be9b807c9b5c9a9d10e2413b09f3db7b4863ad03cf7cec220b596addc8ef8
|
3 |
+
size 26869760
|
params_shard_129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a20c4171c8e408541224f58f9c6681b12b95533c109a49311f9993721c504987
|
3 |
+
size 31117312
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4c3c6e270217c91be350330961fd0e429a67ae9e747d6162d48c3a7fd4a9818c
|
3 |
+
size 93978624
|
params_shard_130.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ce1d0de7f92809fab0162ffacc569d8299ae73e608951646900a54a01a1808b5
|
3 |
+
size 93978624
|
params_shard_131.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f6a0a536d0eb2b0887268e71b6af186a2243cf23439ef92bc1b7991b6697cf0b
|
3 |
+
size 188088320
|
params_shard_132.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dd21825728eb6912f628d96ba219ec3172f701f970570cf91c9377526babe39c
|
3 |
+
size 23511040
|
params_shard_133.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bf832b6c4fd3af6302a91a16e84d8ac91cdc7a02edbb0b355a7e9f7384edbca9
|
3 |
+
size 33587200
|
params_shard_134.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fbbb86d1b157752d3dfc9583afa8fa9a04c6fc0a65183a40635fbe4134f6baa7
|
3 |
+
size 26869760
|
params_shard_135.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:062f10a3f1da3dac52b01d0d61b6c8df7166c464ea7978f8fa9597f17ccfdd8b
|
3 |
+
size 188088320
|
params_shard_136.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e341cbf9b1bb8aa1332174f018a60a4d8efa75ad2a4d223c60433b389f469bec
|
3 |
+
size 23511040
|
params_shard_137.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c0e66551776be65fba011099fcba662beb8316e2646d6036f78c2748851102dd
|
3 |
+
size 33587200
|
params_shard_138.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:03464fa39a92aa2a38dc640b727e32fccecfb43c5d1499a3c7783f69477b9271
|
3 |
+
size 26869760
|
params_shard_139.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:76421b1d416b748f8cc33939f96f759542b630de3030a9b49f3a00a91ad57979
|
3 |
+
size 93978624
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5894673c9c10fd1593183af4e774d2f395a8547563a6d1c1bad9a78d7b3ad6ba
|
3 |
+
size 26910720
|