CharlieFRuan
committed on
Commit
•
7352892
1
Parent(s):
d28ca51
Initial commit
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- logs.txt +0 -0
- mlc-chat-config.json +41 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_15.bin +3 -0
- params_shard_16.bin +3 -0
- params_shard_17.bin +3 -0
- params_shard_18.bin +3 -0
- params_shard_19.bin +3 -0
- params_shard_2.bin +3 -0
- params_shard_20.bin +3 -0
- params_shard_21.bin +3 -0
- params_shard_22.bin +3 -0
- params_shard_23.bin +3 -0
- params_shard_24.bin +3 -0
- params_shard_25.bin +3 -0
- params_shard_26.bin +3 -0
- params_shard_27.bin +3 -0
- params_shard_28.bin +3 -0
- params_shard_29.bin +3 -0
- params_shard_3.bin +3 -0
- params_shard_30.bin +3 -0
- params_shard_31.bin +3 -0
- params_shard_32.bin +3 -0
- params_shard_33.bin +3 -0
- params_shard_34.bin +3 -0
- params_shard_35.bin +3 -0
- params_shard_36.bin +3 -0
- params_shard_37.bin +3 -0
- params_shard_38.bin +3 -0
- params_shard_39.bin +3 -0
- params_shard_4.bin +3 -0
- params_shard_40.bin +3 -0
- params_shard_41.bin +3 -0
- params_shard_42.bin +3 -0
- params_shard_43.bin +3 -0
- params_shard_44.bin +3 -0
- params_shard_45.bin +3 -0
- params_shard_46.bin +3 -0
- params_shard_47.bin +3 -0
- params_shard_48.bin +3 -0
- params_shard_49.bin +3 -0
- params_shard_5.bin +3 -0
- params_shard_50.bin +3 -0
logs.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
mlc-chat-config.json
ADDED
@@ -0,0 +1,41 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"model_type": "gpt_neox",
|
3 |
+
"quantization": "q4f32_1",
|
4 |
+
"model_config": {
|
5 |
+
"use_parallel_residual": false,
|
6 |
+
"hidden_size": 2560,
|
7 |
+
"intermediate_size": 10240,
|
8 |
+
"num_attention_heads": 32,
|
9 |
+
"num_hidden_layers": 32,
|
10 |
+
"layer_norm_eps": 1e-05,
|
11 |
+
"vocab_size": 50432,
|
12 |
+
"rotary_pct": 1.0,
|
13 |
+
"position_embedding_base": 10000,
|
14 |
+
"context_window_size": 2048,
|
15 |
+
"head_dim": 80,
|
16 |
+
"prefill_chunk_size": 2048,
|
17 |
+
"tensor_parallel_shards": 1,
|
18 |
+
"ffn_out_dtype": "float32"
|
19 |
+
},
|
20 |
+
"vocab_size": 50432,
|
21 |
+
"context_window_size": 2048,
|
22 |
+
"sliding_window_size": -1,
|
23 |
+
"prefill_chunk_size": 2048,
|
24 |
+
"attention_sink_size": -1,
|
25 |
+
"tensor_parallel_shards": 1,
|
26 |
+
"mean_gen_len": 128,
|
27 |
+
"max_gen_len": 512,
|
28 |
+
"shift_fill_factor": 0.3,
|
29 |
+
"temperature": 0.7,
|
30 |
+
"repetition_penalty": 1.0,
|
31 |
+
"top_p": 0.95,
|
32 |
+
"conv_template": "redpajama_chat",
|
33 |
+
"pad_token_id": 0,
|
34 |
+
"bos_token_id": 0,
|
35 |
+
"eos_token_id": 0,
|
36 |
+
"tokenizer_files": [
|
37 |
+
"tokenizer.json",
|
38 |
+
"tokenizer_config.json"
|
39 |
+
],
|
40 |
+
"version": "0.1.0"
|
41 |
+
}
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a25be08771a487c48e25c57b7a224276c0f5a09e7f8609c7ba95df8c62934736
|
3 |
+
size 64552960
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bc5b6ae4218087d3c6df03f7d04eb92c81b535f04492648c58266069d61adaf9
|
3 |
+
size 32604160
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0a1279d3f2ea18fe7f71fa044371ce60fd0b9cc0919bf8e8b3eef1cff9b73457
|
3 |
+
size 32860160
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f419b3deed84d2400fd9abf44a6a2240973ed401fdeed8662114c94a62f73481
|
3 |
+
size 32860160
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1bc0aa859314e51d70c280487e0e79f37da8f1ecebfc6fd8d4f9dd02ca8e986e
|
3 |
+
size 32849920
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6050352a5b0c54ef8b62581f7de896000b029437e755dac1ac4d0b9dcf56c4fa
|
3 |
+
size 32860160
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e67592a3b4727e76a0e7114bc53893ac445ba4bfd2c7c0cb64de8440e9cdb9ef
|
3 |
+
size 32860160
|
params_shard_15.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3dc2024ebe77132ce5145912bb8ce192f01ff806cad84bcf5e6ed286e11db476
|
3 |
+
size 32849920
|
params_shard_16.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dae7340a20c76cde781566bca8f8ab8fa804e09ce8a5ec72ea1245bb82f038ca
|
3 |
+
size 32860160
|
params_shard_17.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6df91757ca3f52f00e3f0d9ca00e83c450ef88cd9046ee692d458a5d7b00ced8
|
3 |
+
size 32860160
|
params_shard_18.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e9a55f5f433b21cb71ccb1875715552ec485cb733e2729ab73f067e17086f665
|
3 |
+
size 32849920
|
params_shard_19.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6274bf21d02be1890aef93190b2b8ec48c8181ebf6b6f88a0fc77af7e93890b0
|
3 |
+
size 32860160
|
params_shard_2.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9e9486d0e1f1ee5703adc8b21d1fa9881a3cb06f0217f593dd418737916cc041
|
3 |
+
size 32860160
|
params_shard_20.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6fd618b40e1584369bfedb38cd309d04f2856fa4d2911a0d3b7682042eae5a0b
|
3 |
+
size 32860160
|
params_shard_21.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f7a23d595720d2dc28fafd555a2e024d3a9d6d5e1c99e8b65abf904301ff88c4
|
3 |
+
size 32849920
|
params_shard_22.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:99a46d36cb3f5ef44a0b5057e556ff74b18fbbf7ac7f9292ef765f38efff322d
|
3 |
+
size 32860160
|
params_shard_23.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3eb4d6f44c1c169a5ba26a84ca1fcaaa8db1b9a7d635debfc45c0ee3b8f4820b
|
3 |
+
size 32860160
|
params_shard_24.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0d555d6bcaeec3705364a81f9b0124fcf5675d2ace5b1f5319782d850aadeae9
|
3 |
+
size 32849920
|
params_shard_25.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:694e1161fb74e73625f38b38133616f96a2d1eaa45644a9ac94c4ccefd29ece3
|
3 |
+
size 32860160
|
params_shard_26.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:69511b7043efc00a32e2def1f047a02cdd8b98dce389efb3753ca9fba7a79c7d
|
3 |
+
size 32860160
|
params_shard_27.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1f0cafe7cb452a0f7ba02c52e746f108c17e35fecd5b863a82891a5999d7568a
|
3 |
+
size 32849920
|
params_shard_28.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:07b10bef3c9bd6a58b857ae22bb4f0a975998f109f716aceda18c9115b1cf6d2
|
3 |
+
size 32860160
|
params_shard_29.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4d6e49cca750819ba0c83ca58d0d8eb09b5e77b77abcfe821665e95aca80ab20
|
3 |
+
size 32860160
|
params_shard_3.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e280f3d40053b39942b562eb0fec71ee511209b3ecba4433f65f6063fc4af0a2
|
3 |
+
size 32849920
|
params_shard_30.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8f5e2f9165615ff7ff38eb61734690fe5c0ae4214b96111a15e4501e91d02732
|
3 |
+
size 32849920
|
params_shard_31.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:34867af59dd99375066e2b961bece91be44e3481398d5bdb75d2ce37efda1fa9
|
3 |
+
size 32860160
|
params_shard_32.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f7af55bea5ecdb750c6ffa18d68166c813e9baf4893988770b4f071ab0c3ccb7
|
3 |
+
size 32860160
|
params_shard_33.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7cf5ce7a4353eb78d8cf2188622718eb4d1525c6038f2b23e5d176d3d9dcfb42
|
3 |
+
size 32849920
|
params_shard_34.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dac73a88c23b0b1658336fd9ad90f6982a7c8df54c49a1a30c52841eec3ae334
|
3 |
+
size 32860160
|
params_shard_35.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:94d6e82a3037132912dbc5480eee6063a97a52d6937d4860b8d58dbcadb5ae1b
|
3 |
+
size 32860160
|
params_shard_36.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c2714637b14d3faea1bff2014a3674a90dd5b5c58939ff765b1a4a22ecfb9f4d
|
3 |
+
size 32849920
|
params_shard_37.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:87b61f38dd908a736e748cabfa496db8f9bfafe4ebd45c751a32ca2d0f8bdd67
|
3 |
+
size 32860160
|
params_shard_38.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0852f7d1de9b249aea0138b74e7a941b17dba58c51b2120a035d4ece5a80d342
|
3 |
+
size 32860160
|
params_shard_39.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4fd7ad2abbdfeb6f3b83d5f50394bb73a04d757d5d10f9f117827d64e658f234
|
3 |
+
size 32849920
|
params_shard_4.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bd106cad57955c00cafcfdff28baf7e0dd9db76f741328481df71422af00affe
|
3 |
+
size 32860160
|
params_shard_40.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:69aac50edd3c4fba4d5579ee7e037adbf63d3549ae017fd3619af16eddc71026
|
3 |
+
size 32860160
|
params_shard_41.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:824ef5827edb618fad8a041739a026ef89f0892545dc772e548df87a1d11109b
|
3 |
+
size 32860160
|
params_shard_42.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f806fd49403bff36fa2a606826b6fd5031cfda270082b9c7dff6feb799c1e8a3
|
3 |
+
size 32849920
|
params_shard_43.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9988f89d328815ec1f3eb5b8b822583ffe656a5ade885177a7d60aa5d4bbabc2
|
3 |
+
size 32860160
|
params_shard_44.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3104ddae472eb1adae4d90ffa780ad605b6921a192f7cda130108f3a25dadabf
|
3 |
+
size 32860160
|
params_shard_45.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c1114187747c719dc7c5f255406ee06713a7045878cdd6537ec44ae82f21c4fb
|
3 |
+
size 32849920
|
params_shard_46.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:85672120f25bfbf59285003067f92b5577975517a1a2d983a0e2f5b742587f00
|
3 |
+
size 32860160
|
params_shard_47.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ef63a9e188a0d1a65a4d6160393b80ddc5bdb226d34c2ad0743b7408adbaaa43
|
3 |
+
size 32860160
|
params_shard_48.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dea63f47c2c6475c7ee04c80863a8d2fd2d6cd4903cb8f039b08b4c92666da55
|
3 |
+
size 32849920
|
params_shard_49.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:426de35565111a833338e679a58df3bdf4c5374daa127f526090eafd7ddfbc45
|
3 |
+
size 64552960
|
params_shard_5.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:da761f2bcc98e4b30cefd04485ea30131d6fa9731ca6de9d818598ab9b5e77e0
|
3 |
+
size 32860160
|
params_shard_50.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d73947163ac6b921f36369f92dc3f64283d90905cd36257d4c4b1fbda96d8adc
|
3 |
+
size 32552960
|