Upload LlamaForCausalLM
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- config.json +30 -0
- generation_config.json +6 -0
- model-00001-of-00063.safetensors +3 -0
- model-00002-of-00063.safetensors +3 -0
- model-00003-of-00063.safetensors +3 -0
- model-00004-of-00063.safetensors +3 -0
- model-00005-of-00063.safetensors +3 -0
- model-00006-of-00063.safetensors +3 -0
- model-00007-of-00063.safetensors +3 -0
- model-00008-of-00063.safetensors +3 -0
- model-00009-of-00063.safetensors +3 -0
- model-00010-of-00063.safetensors +3 -0
- model-00011-of-00063.safetensors +3 -0
- model-00012-of-00063.safetensors +3 -0
- model-00013-of-00063.safetensors +3 -0
- model-00014-of-00063.safetensors +3 -0
- model-00015-of-00063.safetensors +3 -0
- model-00016-of-00063.safetensors +3 -0
- model-00017-of-00063.safetensors +3 -0
- model-00018-of-00063.safetensors +3 -0
- model-00019-of-00063.safetensors +3 -0
- model-00020-of-00063.safetensors +3 -0
- model-00021-of-00063.safetensors +3 -0
- model-00022-of-00063.safetensors +3 -0
- model-00023-of-00063.safetensors +3 -0
- model-00024-of-00063.safetensors +3 -0
- model-00025-of-00063.safetensors +3 -0
- model-00026-of-00063.safetensors +3 -0
- model-00027-of-00063.safetensors +3 -0
- model-00028-of-00063.safetensors +3 -0
- model-00029-of-00063.safetensors +3 -0
- model-00030-of-00063.safetensors +3 -0
- model-00031-of-00063.safetensors +3 -0
- model-00032-of-00063.safetensors +3 -0
- model-00033-of-00063.safetensors +3 -0
- model-00034-of-00063.safetensors +3 -0
- model-00035-of-00063.safetensors +3 -0
- model-00036-of-00063.safetensors +3 -0
- model-00037-of-00063.safetensors +3 -0
- model-00038-of-00063.safetensors +3 -0
- model-00039-of-00063.safetensors +3 -0
- model-00040-of-00063.safetensors +3 -0
- model-00041-of-00063.safetensors +3 -0
- model-00042-of-00063.safetensors +3 -0
- model-00043-of-00063.safetensors +3 -0
- model-00044-of-00063.safetensors +3 -0
- model-00045-of-00063.safetensors +3 -0
- model-00046-of-00063.safetensors +3 -0
- model-00047-of-00063.safetensors +3 -0
- model-00048-of-00063.safetensors +3 -0
config.json
ADDED
@@ -0,0 +1,30 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "./alpaca_dragon",
|
3 |
+
"architectures": [
|
4 |
+
"LlamaForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_bias": true,
|
7 |
+
"attention_dropout": 0.0,
|
8 |
+
"bos_token_id": 1,
|
9 |
+
"eos_token_id": 151643,
|
10 |
+
"hidden_act": "silu",
|
11 |
+
"hidden_size": 8192,
|
12 |
+
"initializer_range": 0.02,
|
13 |
+
"intermediate_size": 24576,
|
14 |
+
"max_position_embeddings": 32768,
|
15 |
+
"model_type": "llama",
|
16 |
+
"num_attention_heads": 64,
|
17 |
+
"num_hidden_layers": 80,
|
18 |
+
"num_key_value_heads": 64,
|
19 |
+
"pad_token_id": 151643,
|
20 |
+
"pretraining_tp": 1,
|
21 |
+
"rms_norm_eps": 1e-06,
|
22 |
+
"rope_scaling": null,
|
23 |
+
"rope_theta": 1000000,
|
24 |
+
"seq_length": 32768,
|
25 |
+
"tie_word_embeddings": false,
|
26 |
+
"torch_dtype": "float32",
|
27 |
+
"transformers_version": "4.37.2",
|
28 |
+
"use_cache": true,
|
29 |
+
"vocab_size": 152064
|
30 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_from_model_config": true,
|
3 |
+
"eos_token_id": 151643,
|
4 |
+
"pad_token_id": 151643,
|
5 |
+
"transformers_version": "4.37.2"
|
6 |
+
}
|
model-00001-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:93c877a3c02521f0fbff6812c0163a07aa9e3f24faaf2e7a0f4a3c6a78c88670
|
3 |
+
size 4982833288
|
model-00002-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0a98c92f4b6c9b92499f5a70f4584d78fd06919349c551b15c3ab0f13ed9c68f
|
3 |
+
size 4563732824
|
model-00003-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f8ef9240eafbfe9122a11f93867be86d7a0f530cab7a4efb725fc60dae382b22
|
3 |
+
size 4295165512
|
model-00004-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1092a4b6657ee63f3601103086485b0451017a9015f97bdccb4c1bd8b32b41ba
|
3 |
+
size 4295165504
|
model-00005-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7df17c368c979497868259e9579e0bb458f8a2eac72698cb867fa19555a72605
|
3 |
+
size 4832168168
|
model-00006-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:55ceca019831eebb6f764caa7536e28b38bef6b9f7fc5fdf1ae0c532ddf56648
|
3 |
+
size 4832102408
|
model-00007-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ffb7b82c2eb2b6a2419871ad961c1238be538b4558c39da97b7b452b6e898dc5
|
3 |
+
size 4295165504
|
model-00008-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0339c0a4e0a479449d2f5567592cc831293ee4473292374a9876dfc03dbe2ffb
|
3 |
+
size 4832168168
|
model-00009-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5e19b35f13af81b46f3fe7af748108ef946a7ff870fd72831a9de014cfd3af9f
|
3 |
+
size 4832102424
|
model-00010-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b4eb63611d3961db7c7d77c50c94ad724eaeb0ad2a4f2f2cb764016859189215
|
3 |
+
size 4295165520
|
model-00011-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d52a06da6f3fef5a7b9a5481ab4488e6ecc03b8cc148d9cacff1597b505d2707
|
3 |
+
size 4832168192
|
model-00012-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a0a4ed319afc5686140a5864d5ac81b2ab5f5a002776fd847c0086f2dc88915f
|
3 |
+
size 4832102424
|
model-00013-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dbf70fb5f207d5c6763bbfbb250b522103acb2761fa461c360dd1e194284cbdf
|
3 |
+
size 4295165520
|
model-00014-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:97445490724b2bf6cb6c91d3690d8c7fd497c68a7bc0b3e5f72c9b60abcd2fce
|
3 |
+
size 4832168192
|
model-00015-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f1a7cdbf94fdc3c9b51c0a9d98c95f73ab86890c5d9fe197634b44d69c156042
|
3 |
+
size 4832102424
|
model-00016-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bc07681b1a1ca88cd62d03384d85a1aad3e2ef86f6a3f49643bad6931fc5b531
|
3 |
+
size 4295165520
|
model-00017-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:39cf63b5cd0449d2d769184983591b0ede6ec17f161c69420939f00ab0454fb3
|
3 |
+
size 4832168192
|
model-00018-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:92f478714d92e797071f350f5f826b17faecce3e01ca46b06526513781f0f4d9
|
3 |
+
size 4832102424
|
model-00019-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:49ef74836db85e5a4f566e3e037508d859bf9d05c86c787b9569d5186abb3538
|
3 |
+
size 4295165520
|
model-00020-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0dc8574d35ae909424828fbd08364d86b1fdd0bb464c1a50bd23df4f2a15751f
|
3 |
+
size 4832168192
|
model-00021-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f9b1f6c33a14624e17f9a005637c6932fe30b21f06c960b2e8d465fb716058fa
|
3 |
+
size 4832102424
|
model-00022-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:048048e8183933c58dd5e8a99b0e3a914f77254a7bbad5d96f229d53fe5e14ce
|
3 |
+
size 4295165520
|
model-00023-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dcb13d6b448b99d5ae4fcbe3783e4d4e6e1cac50995729651ba22544abae26b6
|
3 |
+
size 4832168192
|
model-00024-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d666e32bc6ea5920d5ba3293d182d7b7d245bf6132244c21559f78974d62c180
|
3 |
+
size 4832102424
|
model-00025-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:35acb58a2404477d462292a2400b4eb988b1f456bb2c63eb499e785d296c7cd1
|
3 |
+
size 4295165520
|
model-00026-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2e333fb348f29d300d9fc8133c0e2db3df308321365d7aad70c1da9c44ea5f6a
|
3 |
+
size 4832168192
|
model-00027-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c950d79a73fa37c6f9d4e4381c82bdf37c8c2cafdb867560a9687e94b0e542c5
|
3 |
+
size 4832102424
|
model-00028-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1b26052c0d7f8bb8ec2736a9442deb6502d136fa526c5ad53ee6182c902993e9
|
3 |
+
size 4295165520
|
model-00029-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7db2e571dee48466331ec4ac9d557c43edd88e5a9fd738d398bfa3d067202554
|
3 |
+
size 4832168192
|
model-00030-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:59231f35e5106fde9712aed2ddb4d68ea8f070e0f626cfe7754582cdab236101
|
3 |
+
size 4832102424
|
model-00031-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ba27f21b1634dd8674efc645731129a33d0d2acea64d89ffc6968384742d895b
|
3 |
+
size 4295165520
|
model-00032-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e7f446fd5792457f6cf64e8bc1db21695398381010a55f875d2c4b1addd05720
|
3 |
+
size 4832168192
|
model-00033-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f39b8b1c2d27a50f1ed36406cb6f72187fe3c8357fbf326281604eed2db3b3d0
|
3 |
+
size 4832102424
|
model-00034-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9b1686f3badefd24ba6f6f3d4ff58d5e38cb77f0f977ad422681bc027706a27f
|
3 |
+
size 4295165520
|
model-00035-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b25358bfd1b371ddbf53b85df3bbd2bc2302a7fa07a24235188ccdef04cda9ad
|
3 |
+
size 4832168192
|
model-00036-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:17f404f15b70a54354bbcd5a45bdfa5d4fc3a0a2abc97022b90441003f41edba
|
3 |
+
size 4832102424
|
model-00037-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9e15cf02d9a5cb926ad3f320ee1acf46251e6e02c6473a1aebcf870e992976cd
|
3 |
+
size 4295165520
|
model-00038-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:07266edc388c35c263a07d447dfb4c225cf805a3bc24b48c53c830633b0556e6
|
3 |
+
size 4832168192
|
model-00039-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3d651be88789177e0a8ce70e82ee6278a7fec5ee94bcd16af99308cd727b634b
|
3 |
+
size 4832102424
|
model-00040-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fdd57ea872b63a09afd309cfb3442c832e99b449312a10904c12748eea47f4ae
|
3 |
+
size 4295165520
|
model-00041-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:60beed15b42fba44fdb075983e1f6a0264cb67b56c5877908e79f41a93838d7c
|
3 |
+
size 4832168192
|
model-00042-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c408e08466f8be2dcf7264fb337ceaeff351e8c7a39e967428e801a6ed5eb585
|
3 |
+
size 4832102424
|
model-00043-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e5e3b218b504bdbdf2b5bb3b7017e7bf597b55dff983736ff8c48da9a84acec4
|
3 |
+
size 4295165520
|
model-00044-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f06faa7f70300c726c84aaf8bee2850e4545211cf973b71ac56d6cbb04e63ff4
|
3 |
+
size 4832168192
|
model-00045-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2df86e7efbedb5a47094453d26b0345c158dc18ac87a0ab43769e38e17603add
|
3 |
+
size 4832102424
|
model-00046-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7216c735fa661276eff0046564dde6934fb48628a18a44d6e0685a726215ebd2
|
3 |
+
size 4295165520
|
model-00047-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d699b7c928a7bb82416e6f4935bea583862a8d8dabd80d73624e874f19bf3804
|
3 |
+
size 4832168192
|
model-00048-of-00063.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dfb80306a996c78c10a214df178fab9f873d8d5343f9f624bf43b05bb696420a
|
3 |
+
size 4832102424
|