CharlieFRuan
committed on
Commit
•
e6a454e
1
Parent(s):
c9952f2
Initial commit
Browse files- logs.txt +0 -0
- merges.txt +0 -0
- mlc-chat-config.json +38 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_15.bin +3 -0
- params_shard_16.bin +3 -0
- params_shard_17.bin +3 -0
- params_shard_18.bin +3 -0
- params_shard_19.bin +3 -0
- params_shard_2.bin +3 -0
- params_shard_20.bin +3 -0
- params_shard_21.bin +3 -0
- params_shard_22.bin +3 -0
- params_shard_23.bin +3 -0
- params_shard_24.bin +3 -0
- params_shard_25.bin +3 -0
- params_shard_3.bin +3 -0
- params_shard_4.bin +3 -0
- params_shard_5.bin +3 -0
- params_shard_6.bin +3 -0
- params_shard_7.bin +3 -0
- params_shard_8.bin +3 -0
- params_shard_9.bin +3 -0
- tokenizer.json +0 -0
- vocab.json +0 -0
logs.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
merges.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
mlc-chat-config.json
ADDED
@@ -0,0 +1,38 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"model_type": "gpt2",
|
3 |
+
"quantization": "q0f16",
|
4 |
+
"model_config": {
|
5 |
+
"vocab_size": 50257,
|
6 |
+
"n_embd": 1024,
|
7 |
+
"n_layer": 24,
|
8 |
+
"n_head": 16,
|
9 |
+
"layer_norm_epsilon": 1e-05,
|
10 |
+
"n_inner": 4096,
|
11 |
+
"context_window_size": 1024,
|
12 |
+
"prefill_chunk_size": 1024,
|
13 |
+
"scale_attn_by_inverse_layer_idx": false,
|
14 |
+
"tensor_parallel_shards": 1
|
15 |
+
},
|
16 |
+
"vocab_size": 50257,
|
17 |
+
"context_window_size": 1024,
|
18 |
+
"sliding_window_size": -1,
|
19 |
+
"prefill_chunk_size": 1024,
|
20 |
+
"attention_sink_size": -1,
|
21 |
+
"tensor_parallel_shards": 1,
|
22 |
+
"mean_gen_len": 128,
|
23 |
+
"max_gen_len": 512,
|
24 |
+
"shift_fill_factor": 0.3,
|
25 |
+
"temperature": 0.7,
|
26 |
+
"repetition_penalty": 1.0,
|
27 |
+
"top_p": 0.95,
|
28 |
+
"conv_template": "gpt2",
|
29 |
+
"pad_token_id": 0,
|
30 |
+
"bos_token_id": 50256,
|
31 |
+
"eos_token_id": 50256,
|
32 |
+
"tokenizer_files": [
|
33 |
+
"tokenizer.json",
|
34 |
+
"vocab.json",
|
35 |
+
"merges.txt"
|
36 |
+
],
|
37 |
+
"version": "0.1.0"
|
38 |
+
}
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a5bbf0ab20140082b6bd157c026ea52f4c3abb57657eccd26e03324541b0ab86
|
3 |
+
size 102926336
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a5bbf0ab20140082b6bd157c026ea52f4c3abb57657eccd26e03324541b0ab86
|
3 |
+
size 102926336
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:075fa32067b9e31a9e43ad717824cff225383f718c3a2b5cedccf89571d93735
|
3 |
+
size 25192448
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:15d9fcd9c32e4bc527ebd7cb4439f1b704b680fd39e6821cf635097ede0f8f19
|
3 |
+
size 25192448
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d8b487d3a5cd9c9805b29624246ee5cae231649d5737921899f704091d208fd5
|
3 |
+
size 25192448
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f5ed305a54ff5bef99466dc9ce54dc85051512cb7d69f421604c4c2ca2f9373f
|
3 |
+
size 25192448
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3e8720eedb19b4cfd574d3666f20e07181fe2d5f7e7659dbb878f41a3d01df1f
|
3 |
+
size 25192448
|
params_shard_15.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:093ae9fb01dfe042e38d74bd86f96c74571f6cb20eef75aa410e36861836a419
|
3 |
+
size 25192448
|
params_shard_16.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d84dd8f76fe16e30dbd25071d30753075253106572b588e2d995bd3381ccfd2f
|
3 |
+
size 25192448
|
params_shard_17.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:feccea78b3ef3156deb935eaab26571f92d6638a1622e9c8c94bc3da103ffe16
|
3 |
+
size 25192448
|
params_shard_18.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fe0f43931610dcb292c0a1f72750b0f7bf990e404deaea78fe297b152b51470c
|
3 |
+
size 25192448
|
params_shard_19.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dceb785e3daf2715f79e260d602d766ff41a2bb3667ecdbd7a19519d0a427c6c
|
3 |
+
size 25192448
|
params_shard_2.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f86d5865480bb06a8adc38c1d9efaa35d0245f6ce5908ccc14f1b53ab2d55789
|
3 |
+
size 27293696
|
params_shard_20.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:728e03fb934aaa28f77760c5637c4c09ee0332ac2787be6bc9a3dfd0fb8020c1
|
3 |
+
size 25192448
|
params_shard_21.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eeeeabee5fe04f5a615ea5a40510f13e9d585cd372673c8b99ec9d8932288c66
|
3 |
+
size 25192448
|
params_shard_22.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:94224f8a403f33c0c3ce81debd802dba5b985d8353614b3f408f8c07063e38c2
|
3 |
+
size 25192448
|
params_shard_23.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3968b48c301513f3e5ebad14a91084032cd28b1e0fbf1fbfeca8754c9b6aef65
|
3 |
+
size 25192448
|
params_shard_24.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a7a04f105c17a6a49fd117b486b6df40cbcf764b7f54d61590a87504a04e2b36
|
3 |
+
size 25192448
|
params_shard_25.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b5f54fb9070ec8f4c57f6ef7686dc8045790e66888949d34ec8689b89572f859
|
3 |
+
size 16791552
|
params_shard_3.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3ad3e32c483a908c8b352cea55c5891a637536010adfd44ff2864368c2bcf1e3
|
3 |
+
size 31490048
|
params_shard_4.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6d98686613019db45569d7dd8709a947bfffae6cd9ede5f4c2a6dc2fba28b85a
|
3 |
+
size 27295744
|
params_shard_5.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c7389dc1c0842251cf41a64e9bd1e6273ff1bf5f807082d5daef454f4c0668dc
|
3 |
+
size 25192448
|
params_shard_6.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a7085595bbf7a7f0e05e1aeed92d2371545559b282efb9a84771f30ba5374671
|
3 |
+
size 25192448
|
params_shard_7.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4a60b888b17a0189c9a7439455e53424fd2fba9d5043962ea192ebaa4de37461
|
3 |
+
size 25192448
|
params_shard_8.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:99696b59b767f8f0fbaf46c5e17ed88cc018be876a3e6587307cb31f24cd52ff
|
3 |
+
size 25192448
|
params_shard_9.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c05709e9eba5bc8c144f040a165f7f3a78edc7600fb78c509162775a98d58006
|
3 |
+
size 25192448
|
tokenizer.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
vocab.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|