diff --git a/config.json b/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0dbc3ff27ae6f6f8ae0e186767cfb0b8102aefe7 --- /dev/null +++ b/config.json @@ -0,0 +1,24 @@ +{ + "_name_or_path": "decapoda-research/llama-13b-hf", + "architectures": [ + "LlamaForCausalLM" + ], + "bos_token_id": 0, + "eos_token_id": 1, + "hidden_act": "silu", + "hidden_size": 5120, + "initializer_range": 0.02, + "intermediate_size": 13824, + "max_position_embeddings": 2048, + "max_sequence_length": 2048, + "model_type": "llama", + "num_attention_heads": 40, + "num_hidden_layers": 40, + "pad_token_id": -1, + "rms_norm_eps": 1e-06, + "tie_word_embeddings": false, + "torch_dtype": "float16", + "transformers_version": "4.28.0.dev0", + "use_cache": true, + "vocab_size": 32000 +} diff --git a/generation_config.json b/generation_config.json new file mode 100644 index 0000000000000000000000000000000000000000..128b48946713166edcc3e3c62ae5fe285df776be --- /dev/null +++ b/generation_config.json @@ -0,0 +1,7 @@ +{ + "_from_model_config": true, + "bos_token_id": 0, + "eos_token_id": 1, + "pad_token_id": 0, + "transformers_version": "4.28.0.dev0" +} diff --git a/pytorch_model-00001-of-00082.bin b/pytorch_model-00001-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..d1072b0ea799e7157fa17a65e531ff8e5c7d7d24 --- /dev/null +++ b/pytorch_model-00001-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:682e511e31ff864f5142ba57dd9cef2fdb79151e5c7a376ebaab2808b2fe5c58 +size 380110075 diff --git a/pytorch_model-00002-of-00082.bin b/pytorch_model-00002-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..53e50dcf4f62f93537622af7f261b78281e08d28 --- /dev/null +++ b/pytorch_model-00002-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9ea28885c43bdd3167695b2514b77aea3178ef7e79d42de2340a009d711e80e +size 298846638 diff --git a/pytorch_model-00003-of-00082.bin b/pytorch_model-00003-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..2470543445e61c0f48fb1cf71a038ae378aa170f --- /dev/null +++ b/pytorch_model-00003-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b37b2c68a1e85c0b230208757e64667d644bb293ea9d61e191474f2702e2f682 +size 705190126 diff --git a/pytorch_model-00004-of-00082.bin b/pytorch_model-00004-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..ed5b4efe7d64dbd910229a2b2254037890e6dd63 --- /dev/null +++ b/pytorch_model-00004-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3c54c2e17f040b8c0933f5dc44fc7e74a98c7855bb3f1f9973b86f4081c345c +size 387975598 diff --git a/pytorch_model-00005-of-00082.bin b/pytorch_model-00005-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..2159d0b2adb4bada17601368064f88db91a1dc96 --- /dev/null +++ b/pytorch_model-00005-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e6b1f6354c9f303b70bfadc5236e72db3dfe9f416e31a47298416d0b42e0edf +size 668490896 diff --git a/pytorch_model-00006-of-00082.bin b/pytorch_model-00006-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..357a8e07dc9f069a793a4cb5c772dc927222dd27 --- /dev/null +++ b/pytorch_model-00006-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cc1c552640ca98eb953174f314be35003e7d0a83cd66876dfc2503213d47599 +size 283116795 diff --git a/pytorch_model-00007-of-00082.bin b/pytorch_model-00007-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..072c6c50e543a002265d4efc54d81335b1778c74 --- /dev/null +++ b/pytorch_model-00007-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f750f16823ae560423d47bcc0c8d58c2748eda8769703ed0d7f05b91d07069f8 +size 668490896 diff --git a/pytorch_model-00008-of-00082.bin b/pytorch_model-00008-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..8677493c4cd36c57b2e669f2567150c869840cbc --- /dev/null +++ b/pytorch_model-00008-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d80edfca8890f5fa22322cd6a7a074cf8ac967766693d97adc3169ea734ad75 +size 283116795 diff --git a/pytorch_model-00009-of-00082.bin b/pytorch_model-00009-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..28c35747b1606f2b613fd847f8fd53197d631b22 --- /dev/null +++ b/pytorch_model-00009-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7022a4dabc929b08f461b2f6c0237a12edbc5f051e81c8e585c9fac9cc6071a1 +size 668490896 diff --git a/pytorch_model-00010-of-00082.bin b/pytorch_model-00010-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..d03ddd77c776a7649998f759a802c0e1288c0282 --- /dev/null +++ b/pytorch_model-00010-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92e29f91a92127ef330e71f0f664b8d3ada8526427ed6ef8a85efd6a668b8f60 +size 283116795 diff --git a/pytorch_model-00011-of-00082.bin b/pytorch_model-00011-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..72bfa45ca58061845afc0dbb3386f9d8c9d068b9 --- /dev/null +++ b/pytorch_model-00011-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18d8f4b02ac24c9e40d9cbd24d53dbb35793906acf40f070e6f9bfbc8b8fe8ea +size 668490896 diff --git a/pytorch_model-00012-of-00082.bin b/pytorch_model-00012-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..7dc44cc388c43ef7552244a052ad564c31739a0a --- /dev/null +++ b/pytorch_model-00012-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26136f021a572bc5545c45366793f328b27ba7a817169e882ee43512ed920986 +size 283116795 diff --git a/pytorch_model-00013-of-00082.bin b/pytorch_model-00013-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..8eb1b4eb4c8fdfbfc7aa7263618caba2c3c2085a --- /dev/null +++ b/pytorch_model-00013-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:298403c4a544fce56b2991f78b38f776757233daa01bb1abb88388e3c4181f38 +size 668490896 diff --git a/pytorch_model-00014-of-00082.bin b/pytorch_model-00014-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..f76074b851a2e0adb596955f2cebbf4624d6d176 --- /dev/null +++ b/pytorch_model-00014-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad550ac7984955710c3aef53b3cf44b675736373cced6bdde2c10bd90fd05e00 +size 283116795 diff --git a/pytorch_model-00015-of-00082.bin b/pytorch_model-00015-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..ba54accd738d71bb233069498ac487c6c839c636 --- /dev/null +++ b/pytorch_model-00015-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbac8a4013ade62597f004722b24cd987565c579449aa3291142e975f58b1c5b +size 668490896 diff --git a/pytorch_model-00016-of-00082.bin b/pytorch_model-00016-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..10ee4d4ffbd2be738c61b5d2955e77e90b648284 --- /dev/null +++ b/pytorch_model-00016-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8291046bbb599b31c293ce23e3174a87834c97e765d37aff394a8227c120ffcb +size 283116795 diff --git a/pytorch_model-00017-of-00082.bin b/pytorch_model-00017-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..5e7f1c9e46b4009af24ad5f23cef49cfe04e4a48 --- /dev/null +++ b/pytorch_model-00017-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5aa2ed4049053449b3d09ff6d3221e4417a79d519a655aacd6acb9d103280b3 +size 668490896 diff --git a/pytorch_model-00018-of-00082.bin b/pytorch_model-00018-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..7e6e67161e363674e5933b9ebc814b107e6e76d1 --- /dev/null +++ b/pytorch_model-00018-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e25c2a779547ff1bfea36dd16d6ce68844d784c3594f502aa8279723fbb54bfc +size 283116795 diff --git a/pytorch_model-00019-of-00082.bin b/pytorch_model-00019-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..f8d703728389d27cb216f728a22b07a95d1942a7 --- /dev/null +++ b/pytorch_model-00019-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cebff0bcbd0a6238b739fbf8bb76a0a3070056986caaab71d73032fe4374cf9a +size 668490896 diff --git a/pytorch_model-00020-of-00082.bin b/pytorch_model-00020-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..edfb3fbb39b468301570d6f86d87706d92294cd7 --- /dev/null +++ b/pytorch_model-00020-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcf8ba21239f070b3dddf08b428a032ec1a0f0b97adf91d614db67685b8a2f3c +size 283116795 diff --git a/pytorch_model-00021-of-00082.bin b/pytorch_model-00021-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..7d0d5a54102dbf7012b6537b5ec6b072910e91f2 --- /dev/null +++ b/pytorch_model-00021-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab524b969e61498835b1aefee4c414a2f4c2aead303448b13175a541f6cd22d5 +size 668490896 diff --git a/pytorch_model-00022-of-00082.bin b/pytorch_model-00022-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..08e30781089efed1fc42331db4943b7eec37c22d --- /dev/null +++ b/pytorch_model-00022-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c538c86a2cb6f36a03ee39afeb1fbd580c169b6d25b27108e3a6539b68cd8f1 +size 283116795 diff --git a/pytorch_model-00023-of-00082.bin b/pytorch_model-00023-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..ea74e26a3d4d7f55e99931bd4a4d482d02e392ee --- /dev/null +++ b/pytorch_model-00023-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19a55bd4c75817e651163a97c22009a48e55b5e5b5e95e33546c477c5ae9f847 +size 668490896 diff --git a/pytorch_model-00024-of-00082.bin b/pytorch_model-00024-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..ad36a39e79b2883251924da5f297a8870441a325 --- /dev/null +++ b/pytorch_model-00024-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6591f1b2560ba2159919148ccd3d14edc04503f2d006ed1b15b57c57f626e9e9 +size 283116795 diff --git a/pytorch_model-00025-of-00082.bin b/pytorch_model-00025-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..b5aea0a89e497e1d7c02d3213db32593a28a6ff8 --- /dev/null +++ b/pytorch_model-00025-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fa9a5367a44a30e1d149468e8982d8fb7d4f81622f7db2a2b1669ef16cedf98 +size 668490896 diff --git a/pytorch_model-00026-of-00082.bin b/pytorch_model-00026-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..4b1d3ef696bb24a46397b4b177c482422026f37b --- /dev/null +++ b/pytorch_model-00026-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76eee6652908ce206baf7357d9f5d8ad301a8f8d79428aec99ef7dec3b32e646 +size 283116795 diff --git a/pytorch_model-00027-of-00082.bin b/pytorch_model-00027-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..710e857eaf3b380dd6679fc7dd8f8ad0b084c011 --- /dev/null +++ b/pytorch_model-00027-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c689dd3d97e13df6f0cd1b5e80cb0bf08f6e1e91fa57756aa7f534c68c49d21 +size 668490896 diff --git a/pytorch_model-00028-of-00082.bin b/pytorch_model-00028-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..8bc06c4502866ee765ff1742345d92fd8a518579 --- /dev/null +++ b/pytorch_model-00028-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4242a2a58ee759158f020d7164b669b278a82c23eba7c40ba9e25068c2b91ce +size 283116795 diff --git a/pytorch_model-00029-of-00082.bin b/pytorch_model-00029-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..7a1fdc116977ccce5e710b2a2296e227805c233c --- /dev/null +++ b/pytorch_model-00029-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7b1297ff4ba3b71802930a3a930f8e4137caab87e0ed3c74eee8b9a951cdf8b +size 668490896 diff --git a/pytorch_model-00030-of-00082.bin b/pytorch_model-00030-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..008b4aa2912bc378c15b46bafc75976237f22116 --- /dev/null +++ b/pytorch_model-00030-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e1dc8c99a219094b4464fa6c4e7d16de5851ed53b1a94444c6f8045a5ebef9a +size 283116795 diff --git a/pytorch_model-00031-of-00082.bin b/pytorch_model-00031-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..2565e59b165e334cea7946b0faa517ce3ff39429 --- /dev/null +++ b/pytorch_model-00031-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db4c4d565dd4538e5426c663428eff281fc407be53792d62eefaf48091e4f17c +size 668490896 diff --git a/pytorch_model-00032-of-00082.bin b/pytorch_model-00032-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..fa184fc30de69e72b83ada5d64de91de9c5af5ee --- /dev/null +++ b/pytorch_model-00032-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d21051227d43ddb58ae705034715939d70ada16a19c8d009003779174b62ad7 +size 283116795 diff --git a/pytorch_model-00033-of-00082.bin b/pytorch_model-00033-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..cb880d4bdc0fb27a303f64084f24cad7d7eed3f2 --- /dev/null +++ b/pytorch_model-00033-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5185d4b391f112018e2ceb13d9c544713c299600ce62b321753c4b98f03369e9 +size 668490896 diff --git a/pytorch_model-00034-of-00082.bin b/pytorch_model-00034-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..2391de0b4b48b010c30b76ecf93517c2ae2c19d2 --- /dev/null +++ b/pytorch_model-00034-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d881ebfef6c0f21c05c8d19a58dee4715b720f7448041aebd37c95c34d440eda +size 283116795 diff --git a/pytorch_model-00035-of-00082.bin b/pytorch_model-00035-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..dc00809e6501df48e2fa82ec58fdb4d34ed9899d --- /dev/null +++ b/pytorch_model-00035-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b2ef122846e19d02044b0041b07d7f2ec8929654c3d21a7d64a126f3fb991d5 +size 668490896 diff --git a/pytorch_model-00036-of-00082.bin b/pytorch_model-00036-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..323cf0ebb49aac5ce575a1c29f8cbc05c7a2afc9 --- /dev/null +++ b/pytorch_model-00036-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d315936eb49804cd38444850a42a62b6f1190b55fff13d9a8ebd79abe0043045 +size 283116795 diff --git a/pytorch_model-00037-of-00082.bin b/pytorch_model-00037-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..40eff9646b8eedd0db8b274d3616f1d727405bd4 --- /dev/null +++ b/pytorch_model-00037-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc4bc39da45bb0572149dbbc83aab633316270a90222023c5d291ee79826816f +size 668490896 diff --git a/pytorch_model-00038-of-00082.bin b/pytorch_model-00038-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..0cc5eeb7a99c0672ca99496e44cebbfa40d42b80 --- /dev/null +++ b/pytorch_model-00038-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a48a714ba461c060ef66cd735cf8096b1b097365e9538bde4369250c1f36d044 +size 283116795 diff --git a/pytorch_model-00039-of-00082.bin b/pytorch_model-00039-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..975f8e900c1cb5926957297fc9dd087525bf7f8e --- /dev/null +++ b/pytorch_model-00039-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f91ad897515ab0efaeb417752ac3f3031bdeaa198d2a748c58f8f96e007d9a03 +size 668490896 diff --git a/pytorch_model-00040-of-00082.bin b/pytorch_model-00040-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..cde7a16ff10c2ef84dd3c07da31bf4ab1b69adc1 --- /dev/null +++ b/pytorch_model-00040-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b776517d136e5f14cb85f31e02a4c63e460d3e2eec62008e7de6ea236825ff51 +size 283116795 diff --git a/pytorch_model-00041-of-00082.bin b/pytorch_model-00041-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..1ae8670c5286fe3baadce6ae70ac72712b478f23 --- /dev/null +++ b/pytorch_model-00041-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9a19851fbe5da64c8bb410457f1cf81f934674bce851aed69c366b4d3cf54ab +size 668490896 diff --git a/pytorch_model-00042-of-00082.bin b/pytorch_model-00042-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..f0a47275068a00ee3447a45ec987f23e22a8e0ca --- /dev/null +++ b/pytorch_model-00042-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b63fe9b47295b20f5c5a60bb36f5a6f6e314ebe57e34a4c430b0da3092179aa4 +size 283116795 diff --git a/pytorch_model-00043-of-00082.bin b/pytorch_model-00043-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..20344efbf3a87de75c394638115d180c97b7ec05 --- /dev/null +++ b/pytorch_model-00043-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6d0b268e18f3c19dbdd05533dd20da5a4e976ab9b68c15679a82f8ee19ff92d +size 668490896 diff --git a/pytorch_model-00044-of-00082.bin b/pytorch_model-00044-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..7a20536dbe8a13b0031d74d8b520d1e863757bfe --- /dev/null +++ b/pytorch_model-00044-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f490f7529120107a27b4967fc45616554d7690ebfef90340bd78afe4f3dfc9c4 +size 283116795 diff --git a/pytorch_model-00045-of-00082.bin b/pytorch_model-00045-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..b55c43cb467fb6cb1c0f566b709ac7bc4c39c30f --- /dev/null +++ b/pytorch_model-00045-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:febb0b2b479c1a00b70f2ad49053d5733e17c9bbe91ab0a7d8017a283137a273 +size 668490896 diff --git a/pytorch_model-00046-of-00082.bin b/pytorch_model-00046-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..2661ad2b5e66b355dfbaaf0c7a190a792f3fb893 --- /dev/null +++ b/pytorch_model-00046-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:963c52db583c853a94492302ed24175739788a8e506e8f6e10967d1c98fe49e7 +size 283116795 diff --git a/pytorch_model-00047-of-00082.bin b/pytorch_model-00047-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..2c85d85209b5bc8951bf3b011e99df7a4754578c --- /dev/null +++ b/pytorch_model-00047-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc6949be933035862f7cf368c544a3502544a24f500364681c646b35cf0bb82e +size 668490896 diff --git a/pytorch_model-00048-of-00082.bin b/pytorch_model-00048-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..1ebd44f8ab95a2a870c893359c9e2fdb6bb78be2 --- /dev/null +++ b/pytorch_model-00048-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e65b070c829a8a340fc527208e4a86642cbb4bce46c2df9dd3ad2b7dcede1a8 +size 283116795 diff --git a/pytorch_model-00049-of-00082.bin b/pytorch_model-00049-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..6c19eead2a1c8d01e00ab935b862e98fcb3b8dbe --- /dev/null +++ b/pytorch_model-00049-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e9ffcbbc2800af6e9bdc2f957487ba374280f4752ed9498016ad476616ba5c7 +size 668490896 diff --git a/pytorch_model-00050-of-00082.bin b/pytorch_model-00050-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..97c0d1b131331958d76d9cf7a06be78d215fa839 --- /dev/null +++ b/pytorch_model-00050-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a450672e6cbd1662afd63d5df8fdc8403b756660924981293a5b8914b1a0098 +size 283116795 diff --git a/pytorch_model-00051-of-00082.bin b/pytorch_model-00051-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..e091b898651a5737d36cceffff296380af7c061d --- /dev/null +++ b/pytorch_model-00051-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f55148622e53b0b7a773484bd1fadfcf66eac3a52d940787750b1f8857090363 +size 668490896 diff --git a/pytorch_model-00052-of-00082.bin b/pytorch_model-00052-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..68503a1007d7bc2cdc1eaddb559d4f9140e2f661 --- /dev/null +++ b/pytorch_model-00052-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c37f281c2089e5df89852267702e03082654361db15e14eeb499d3f4d0ba641c +size 283116795 diff --git a/pytorch_model-00053-of-00082.bin b/pytorch_model-00053-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..d55050722851fc6ce7b2d0659f6713cb796ffb63 --- /dev/null +++ b/pytorch_model-00053-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fa80db2a0a94191edf1c0e0474337f80a47e3d74e252bf8b508db4fb9a98e71 +size 668490896 diff --git a/pytorch_model-00054-of-00082.bin b/pytorch_model-00054-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..d7e6272daa4ee027c0d50beb3ab31ed1ac31b92a --- /dev/null +++ b/pytorch_model-00054-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea497fd39a273ef3548d639029ee5dac5369c9234313ab5adb807e652c7ea88e +size 283116795 diff --git a/pytorch_model-00055-of-00082.bin b/pytorch_model-00055-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..ea2520d5d6e462749a7b8b52b527b089ed812006 --- /dev/null +++ b/pytorch_model-00055-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fb5a435b3417938b86b33369c5d600cc6ef2f3fa888417c79ea22b0dea27605 +size 668490896 diff --git a/pytorch_model-00056-of-00082.bin b/pytorch_model-00056-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..292db6b253b2b8e1575cb6fc6902623ebbba8de7 --- /dev/null +++ b/pytorch_model-00056-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3516e224b00db94be2369cdb79a26252ef59d1035f882494f8eee3a7430803b +size 283116795 diff --git a/pytorch_model-00057-of-00082.bin b/pytorch_model-00057-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..ba139eee74bc9fb3dbe3dbae7e5ee4704a0271f3 --- /dev/null +++ b/pytorch_model-00057-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6dd1e270e2f3c44c56d03c8317b0fdbae7be640f44b8840d7befe186322e7696 +size 668490896 diff --git a/pytorch_model-00058-of-00082.bin b/pytorch_model-00058-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..634d5bbbc3480dc3d63d78049f1bd60805f29aa1 --- /dev/null +++ b/pytorch_model-00058-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e0eaef3c37133f5398f5037e8ad0de1590cdd150ac27d5232187f513ff716be +size 283116795 diff --git a/pytorch_model-00059-of-00082.bin b/pytorch_model-00059-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..b13ae82540d90a34caa9bdf7268b2a9e2f431afb --- /dev/null +++ b/pytorch_model-00059-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7107fc127260056b8dd99abd32ed20bc5e7cfe342cf135f35d7806a925773666 +size 668490896 diff --git a/pytorch_model-00060-of-00082.bin b/pytorch_model-00060-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..59041dae0c8794cd217762dd2fa672cbb700e30b --- /dev/null +++ b/pytorch_model-00060-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cb609dbcf9246c840aad81709f99a941c91a996761770326f6827a2666649f6 +size 283116795 diff --git a/pytorch_model-00061-of-00082.bin b/pytorch_model-00061-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..95d08182fe7dc7144ba97beacd23861041ee157b --- /dev/null +++ b/pytorch_model-00061-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bbb30f56f9a295ea61560cb90a5de67c9343935e7d226f26773422c39c9aad1 +size 668490896 diff --git a/pytorch_model-00062-of-00082.bin b/pytorch_model-00062-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..bcd374814524160180a4d69e7bbbdb981e575aad --- /dev/null +++ b/pytorch_model-00062-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab2404d8f80ec7c0a34d0a68c89ab7921bcfe3822ec0b3fcda57e46708ab6982 +size 283116795 diff --git a/pytorch_model-00063-of-00082.bin b/pytorch_model-00063-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..deff186e285340f8d8e58d06e141bb9d482be601 --- /dev/null +++ b/pytorch_model-00063-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48a4530770a341c6cfc927bf9ffd13422a194b26973626c9477ec1f3f981f09d +size 668490896 diff --git a/pytorch_model-00064-of-00082.bin b/pytorch_model-00064-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..9c6b7c399419d69ead21bc3c805991b13119323b --- /dev/null +++ b/pytorch_model-00064-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd16b03bb7c34197619ac71bce209ef1eba87748168a19894b222b6f0ca837de +size 283116795 diff --git a/pytorch_model-00065-of-00082.bin b/pytorch_model-00065-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..3716616701ea1a22dd21e360dd7f9fd17a718c71 --- /dev/null +++ b/pytorch_model-00065-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:945d34b59ae08a8d716bffd240bfb25231f2ecc73f424600172def5cebc11e22 +size 668490896 diff --git a/pytorch_model-00066-of-00082.bin b/pytorch_model-00066-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..07f3512e6a4e8b6303618fb87983df0edff6d96e --- /dev/null +++ b/pytorch_model-00066-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:287b0055cd6c213d5537d297f39dee8238a9ac75e90c4ae2cd150b48b01eae37 +size 283116795 diff --git a/pytorch_model-00067-of-00082.bin b/pytorch_model-00067-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..a173bdb98971e5dacaa66a389f8c70c842cfed89 --- /dev/null +++ b/pytorch_model-00067-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efbd8460e0b19585126ef594de24beaf812866394b08e2656a16fd6a367b3e30 +size 668490896 diff --git a/pytorch_model-00068-of-00082.bin b/pytorch_model-00068-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..4e6ab793c98eb3cdb7b7c37d255258b999fd5b66 --- /dev/null +++ b/pytorch_model-00068-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8133dff37c97e3c787b596afcfee9187ccc4f98fc6a049f6ade30667ef0c5dc9 +size 283116795 diff --git a/pytorch_model-00069-of-00082.bin b/pytorch_model-00069-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..4982f9fc60599a3748670c53848bafdc67157c9f --- /dev/null +++ b/pytorch_model-00069-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f96af8feabb4386392bc6af989e54787f6351b27fe51e866d64de976c3aaa1b4 +size 668490896 diff --git a/pytorch_model-00070-of-00082.bin b/pytorch_model-00070-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..b9464b16867821776bb0b78fdc11c1e3e8608e39 --- /dev/null +++ b/pytorch_model-00070-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10f09b9e414918496844673f7028e3be069fd2224d3f15c42b6390399ab9013b +size 283116795 diff --git a/pytorch_model-00071-of-00082.bin b/pytorch_model-00071-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..eb5b1ce28fbb59ddce6ddd936cf664e576c6b373 --- /dev/null +++ b/pytorch_model-00071-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8f12a08aa58f18e2504904f4eb0d56baef6b41b0728252298b625329f77b56c +size 668490896 diff --git a/pytorch_model-00072-of-00082.bin b/pytorch_model-00072-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..7e5d3eb6ca30f1d22751da7b86eb652c8fc448cb --- /dev/null +++ b/pytorch_model-00072-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87b432946a6195b4f93f0c0c3045f38541c6254e782098bef4cda8c1387989b1 +size 283116795 diff --git a/pytorch_model-00073-of-00082.bin b/pytorch_model-00073-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..fdec652fb5ec8ed22727a7047635f4fa449a52f6 --- /dev/null +++ b/pytorch_model-00073-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dec4e6cb97e1cc520ad7fedddd51f9ad805c315cfcc2ce9433efc21ca1f8f393 +size 668490896 diff --git a/pytorch_model-00074-of-00082.bin b/pytorch_model-00074-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..b8f73ce9cdd14464e71ad4f6e1392cde8debd202 --- /dev/null +++ b/pytorch_model-00074-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:224ea5ebc9d1868d5f40ca08d85c4070542d4be11b3d638893d3e6a9aeeac402 +size 283116795 diff --git a/pytorch_model-00075-of-00082.bin b/pytorch_model-00075-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..216b05ad61aeedcf04afa39bce2b440522c91159 --- /dev/null +++ b/pytorch_model-00075-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fb6f42c9cd8d5c2b6c60465b2c958698173527d954b46ddf9ac9178bde7aad2 +size 668490896 diff --git a/pytorch_model-00076-of-00082.bin b/pytorch_model-00076-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..976473a25e230e342101b10d577567e06ffb5f38 --- /dev/null +++ b/pytorch_model-00076-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9355f4cdef3c2e54f8da6b5afe4bc229be89492f6a4ea5edeecaadc32441f7c5 +size 283116795 diff --git a/pytorch_model-00077-of-00082.bin b/pytorch_model-00077-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..d6969459e1d9621ed0a6ed13409aa22cdacace02 --- /dev/null +++ b/pytorch_model-00077-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce51a1537d07f4db6668090fc8049b502241f7556cc5615debcaaf6646d73c34 +size 668490896 diff --git a/pytorch_model-00078-of-00082.bin b/pytorch_model-00078-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..f8434c1b4df43d646559b7131693a8e943c6c4a2 --- /dev/null +++ b/pytorch_model-00078-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd6e8e8a506ac480b7663483317f9562fdb5b8ffcda6c4442927b40fe614d9bd +size 283116795 diff --git a/pytorch_model-00079-of-00082.bin b/pytorch_model-00079-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..c2c7db185acf8bd5ec24b406b9748d6d2eb0edab --- /dev/null +++ b/pytorch_model-00079-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d536821daf308fba127fb474ece91bb52ef4381fa9a57eae620180475a49c9a4 +size 668490896 diff --git a/pytorch_model-00080-of-00082.bin b/pytorch_model-00080-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..fedf94e52ef9bb07e67d0abee14db0b30ab7c86e --- /dev/null +++ b/pytorch_model-00080-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:153c78065e32366f6aaabb34f329a70bbbd6ae0cd668076f6d60230666852a54 +size 283116795 diff --git a/pytorch_model-00081-of-00082.bin b/pytorch_model-00081-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..e26932c2da17992ab465f0c5acf341e5b8431bc5 --- /dev/null +++ b/pytorch_model-00081-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45576a40edbfc363b894ddf5d279fe0f9108fe038eefec0edc4b4ac9113c1e8a +size 786464332 diff --git a/pytorch_model-00082-of-00082.bin b/pytorch_model-00082-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..aeadcc189df9d810b2dc9587b9fa7da6fa711b3d --- /dev/null +++ b/pytorch_model-00082-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97114576d6423820ea4a95b4fbf2f646d519765dc3b7d849363b476254b9a3ba +size 327680938 diff --git a/pytorch_model.bin.index.json b/pytorch_model.bin.index.json new file mode 100644 index 0000000000000000000000000000000000000000..e684cedb1a653453ef5bec1df2994064d057ee48 --- /dev/null +++ b/pytorch_model.bin.index.json @@ -0,0 +1,410 @@ +{ + "metadata": { + "total_size": 26031738880 + }, + "weight_map": { + "lm_head.weight": "pytorch_model-00082-of-00082.bin", + "model.embed_tokens.weight": "pytorch_model-00001-of-00082.bin", + "model.layers.0.input_layernorm.weight": "pytorch_model-00003-of-00082.bin", + "model.layers.0.mlp.down_proj.weight": "pytorch_model-00003-of-00082.bin", + "model.layers.0.mlp.gate_proj.weight": "pytorch_model-00002-of-00082.bin", + "model.layers.0.mlp.up_proj.weight": "pytorch_model-00003-of-00082.bin", + "model.layers.0.post_attention_layernorm.weight": "pytorch_model-00003-of-00082.bin", + "model.layers.0.self_attn.k_proj.weight": "pytorch_model-00002-of-00082.bin", + "model.layers.0.self_attn.o_proj.weight": "pytorch_model-00002-of-00082.bin", + "model.layers.0.self_attn.q_proj.weight": "pytorch_model-00001-of-00082.bin", + "model.layers.0.self_attn.rotary_emb.inv_freq": "pytorch_model-00002-of-00082.bin", + "model.layers.0.self_attn.v_proj.weight": "pytorch_model-00002-of-00082.bin", + "model.layers.1.input_layernorm.weight": "pytorch_model-00005-of-00082.bin", + "model.layers.1.mlp.down_proj.weight": "pytorch_model-00004-of-00082.bin", + "model.layers.1.mlp.gate_proj.weight": "pytorch_model-00004-of-00082.bin", + "model.layers.1.mlp.up_proj.weight": "pytorch_model-00005-of-00082.bin", + "model.layers.1.post_attention_layernorm.weight": "pytorch_model-00005-of-00082.bin", + "model.layers.1.self_attn.k_proj.weight": "pytorch_model-00003-of-00082.bin", + "model.layers.1.self_attn.o_proj.weight": "pytorch_model-00004-of-00082.bin", + "model.layers.1.self_attn.q_proj.weight": "pytorch_model-00003-of-00082.bin", + "model.layers.1.self_attn.rotary_emb.inv_freq": "pytorch_model-00004-of-00082.bin", + "model.layers.1.self_attn.v_proj.weight": "pytorch_model-00004-of-00082.bin", + "model.layers.10.input_layernorm.weight": "pytorch_model-00023-of-00082.bin", + "model.layers.10.mlp.down_proj.weight": "pytorch_model-00022-of-00082.bin", + "model.layers.10.mlp.gate_proj.weight": "pytorch_model-00022-of-00082.bin", + "model.layers.10.mlp.up_proj.weight": "pytorch_model-00023-of-00082.bin", + "model.layers.10.post_attention_layernorm.weight": "pytorch_model-00023-of-00082.bin", + "model.layers.10.self_attn.k_proj.weight": "pytorch_model-00021-of-00082.bin", + "model.layers.10.self_attn.o_proj.weight": "pytorch_model-00021-of-00082.bin", + "model.layers.10.self_attn.q_proj.weight": "pytorch_model-00021-of-00082.bin", + "model.layers.10.self_attn.rotary_emb.inv_freq": "pytorch_model-00021-of-00082.bin", + "model.layers.10.self_attn.v_proj.weight": "pytorch_model-00021-of-00082.bin", + "model.layers.11.input_layernorm.weight": "pytorch_model-00025-of-00082.bin", + "model.layers.11.mlp.down_proj.weight": "pytorch_model-00024-of-00082.bin", + "model.layers.11.mlp.gate_proj.weight": "pytorch_model-00024-of-00082.bin", + "model.layers.11.mlp.up_proj.weight": "pytorch_model-00025-of-00082.bin", + "model.layers.11.post_attention_layernorm.weight": "pytorch_model-00025-of-00082.bin", + "model.layers.11.self_attn.k_proj.weight": "pytorch_model-00023-of-00082.bin", + "model.layers.11.self_attn.o_proj.weight": "pytorch_model-00023-of-00082.bin", + "model.layers.11.self_attn.q_proj.weight": "pytorch_model-00023-of-00082.bin", + "model.layers.11.self_attn.rotary_emb.inv_freq": "pytorch_model-00023-of-00082.bin", + "model.layers.11.self_attn.v_proj.weight": "pytorch_model-00023-of-00082.bin", + "model.layers.12.input_layernorm.weight": "pytorch_model-00027-of-00082.bin", + "model.layers.12.mlp.down_proj.weight": "pytorch_model-00026-of-00082.bin", + "model.layers.12.mlp.gate_proj.weight": "pytorch_model-00026-of-00082.bin", + "model.layers.12.mlp.up_proj.weight": "pytorch_model-00027-of-00082.bin", + "model.layers.12.post_attention_layernorm.weight": "pytorch_model-00027-of-00082.bin", + "model.layers.12.self_attn.k_proj.weight": "pytorch_model-00025-of-00082.bin", + "model.layers.12.self_attn.o_proj.weight": "pytorch_model-00025-of-00082.bin", + "model.layers.12.self_attn.q_proj.weight": "pytorch_model-00025-of-00082.bin", + "model.layers.12.self_attn.rotary_emb.inv_freq": "pytorch_model-00025-of-00082.bin", + "model.layers.12.self_attn.v_proj.weight": "pytorch_model-00025-of-00082.bin", + "model.layers.13.input_layernorm.weight": "pytorch_model-00029-of-00082.bin", + "model.layers.13.mlp.down_proj.weight": "pytorch_model-00028-of-00082.bin", + "model.layers.13.mlp.gate_proj.weight": "pytorch_model-00028-of-00082.bin", + "model.layers.13.mlp.up_proj.weight": "pytorch_model-00029-of-00082.bin", + "model.layers.13.post_attention_layernorm.weight": "pytorch_model-00029-of-00082.bin", + "model.layers.13.self_attn.k_proj.weight": "pytorch_model-00027-of-00082.bin", + "model.layers.13.self_attn.o_proj.weight": "pytorch_model-00027-of-00082.bin", + "model.layers.13.self_attn.q_proj.weight": "pytorch_model-00027-of-00082.bin", + "model.layers.13.self_attn.rotary_emb.inv_freq": "pytorch_model-00027-of-00082.bin", + "model.layers.13.self_attn.v_proj.weight": "pytorch_model-00027-of-00082.bin", + "model.layers.14.input_layernorm.weight": "pytorch_model-00031-of-00082.bin", + "model.layers.14.mlp.down_proj.weight": "pytorch_model-00030-of-00082.bin", + "model.layers.14.mlp.gate_proj.weight": "pytorch_model-00030-of-00082.bin", + "model.layers.14.mlp.up_proj.weight": "pytorch_model-00031-of-00082.bin", + "model.layers.14.post_attention_layernorm.weight": "pytorch_model-00031-of-00082.bin", + "model.layers.14.self_attn.k_proj.weight": "pytorch_model-00029-of-00082.bin", + "model.layers.14.self_attn.o_proj.weight": "pytorch_model-00029-of-00082.bin", + "model.layers.14.self_attn.q_proj.weight": "pytorch_model-00029-of-00082.bin", + "model.layers.14.self_attn.rotary_emb.inv_freq": "pytorch_model-00029-of-00082.bin", + "model.layers.14.self_attn.v_proj.weight": "pytorch_model-00029-of-00082.bin", + "model.layers.15.input_layernorm.weight": "pytorch_model-00033-of-00082.bin", + "model.layers.15.mlp.down_proj.weight": "pytorch_model-00032-of-00082.bin", + "model.layers.15.mlp.gate_proj.weight": "pytorch_model-00032-of-00082.bin", + "model.layers.15.mlp.up_proj.weight": "pytorch_model-00033-of-00082.bin", + "model.layers.15.post_attention_layernorm.weight": "pytorch_model-00033-of-00082.bin", + "model.layers.15.self_attn.k_proj.weight": "pytorch_model-00031-of-00082.bin", + "model.layers.15.self_attn.o_proj.weight": "pytorch_model-00031-of-00082.bin", + "model.layers.15.self_attn.q_proj.weight": "pytorch_model-00031-of-00082.bin", + "model.layers.15.self_attn.rotary_emb.inv_freq": "pytorch_model-00031-of-00082.bin", + "model.layers.15.self_attn.v_proj.weight": "pytorch_model-00031-of-00082.bin", + "model.layers.16.input_layernorm.weight": "pytorch_model-00035-of-00082.bin", + "model.layers.16.mlp.down_proj.weight": "pytorch_model-00034-of-00082.bin", + "model.layers.16.mlp.gate_proj.weight": "pytorch_model-00034-of-00082.bin", + "model.layers.16.mlp.up_proj.weight": "pytorch_model-00035-of-00082.bin", + "model.layers.16.post_attention_layernorm.weight": "pytorch_model-00035-of-00082.bin", + "model.layers.16.self_attn.k_proj.weight": "pytorch_model-00033-of-00082.bin", + "model.layers.16.self_attn.o_proj.weight": "pytorch_model-00033-of-00082.bin", + "model.layers.16.self_attn.q_proj.weight": "pytorch_model-00033-of-00082.bin", + "model.layers.16.self_attn.rotary_emb.inv_freq": "pytorch_model-00033-of-00082.bin", + "model.layers.16.self_attn.v_proj.weight": "pytorch_model-00033-of-00082.bin", + "model.layers.17.input_layernorm.weight": "pytorch_model-00037-of-00082.bin", + "model.layers.17.mlp.down_proj.weight": "pytorch_model-00036-of-00082.bin", + "model.layers.17.mlp.gate_proj.weight": "pytorch_model-00036-of-00082.bin", + "model.layers.17.mlp.up_proj.weight": "pytorch_model-00037-of-00082.bin", + "model.layers.17.post_attention_layernorm.weight": "pytorch_model-00037-of-00082.bin", + "model.layers.17.self_attn.k_proj.weight": "pytorch_model-00035-of-00082.bin", + "model.layers.17.self_attn.o_proj.weight": "pytorch_model-00035-of-00082.bin", + "model.layers.17.self_attn.q_proj.weight": "pytorch_model-00035-of-00082.bin", + "model.layers.17.self_attn.rotary_emb.inv_freq": "pytorch_model-00035-of-00082.bin", + "model.layers.17.self_attn.v_proj.weight": "pytorch_model-00035-of-00082.bin", + "model.layers.18.input_layernorm.weight": "pytorch_model-00039-of-00082.bin", + "model.layers.18.mlp.down_proj.weight": "pytorch_model-00038-of-00082.bin", + "model.layers.18.mlp.gate_proj.weight": "pytorch_model-00038-of-00082.bin", + "model.layers.18.mlp.up_proj.weight": "pytorch_model-00039-of-00082.bin", + "model.layers.18.post_attention_layernorm.weight": "pytorch_model-00039-of-00082.bin", + "model.layers.18.self_attn.k_proj.weight": "pytorch_model-00037-of-00082.bin", + "model.layers.18.self_attn.o_proj.weight": "pytorch_model-00037-of-00082.bin", + "model.layers.18.self_attn.q_proj.weight": "pytorch_model-00037-of-00082.bin", + "model.layers.18.self_attn.rotary_emb.inv_freq": "pytorch_model-00037-of-00082.bin", + "model.layers.18.self_attn.v_proj.weight": "pytorch_model-00037-of-00082.bin", + "model.layers.19.input_layernorm.weight": "pytorch_model-00041-of-00082.bin", + "model.layers.19.mlp.down_proj.weight": "pytorch_model-00040-of-00082.bin", + "model.layers.19.mlp.gate_proj.weight": "pytorch_model-00040-of-00082.bin", + "model.layers.19.mlp.up_proj.weight": "pytorch_model-00041-of-00082.bin", + "model.layers.19.post_attention_layernorm.weight": "pytorch_model-00041-of-00082.bin", + "model.layers.19.self_attn.k_proj.weight": "pytorch_model-00039-of-00082.bin", + "model.layers.19.self_attn.o_proj.weight": "pytorch_model-00039-of-00082.bin", + "model.layers.19.self_attn.q_proj.weight": "pytorch_model-00039-of-00082.bin", + "model.layers.19.self_attn.rotary_emb.inv_freq": "pytorch_model-00039-of-00082.bin", + "model.layers.19.self_attn.v_proj.weight": "pytorch_model-00039-of-00082.bin", + "model.layers.2.input_layernorm.weight": "pytorch_model-00007-of-00082.bin", + "model.layers.2.mlp.down_proj.weight": "pytorch_model-00006-of-00082.bin", + "model.layers.2.mlp.gate_proj.weight": "pytorch_model-00006-of-00082.bin", + "model.layers.2.mlp.up_proj.weight": "pytorch_model-00007-of-00082.bin", + "model.layers.2.post_attention_layernorm.weight": "pytorch_model-00007-of-00082.bin", + "model.layers.2.self_attn.k_proj.weight": "pytorch_model-00005-of-00082.bin", + "model.layers.2.self_attn.o_proj.weight": "pytorch_model-00005-of-00082.bin", + "model.layers.2.self_attn.q_proj.weight": "pytorch_model-00005-of-00082.bin", + "model.layers.2.self_attn.rotary_emb.inv_freq": "pytorch_model-00005-of-00082.bin", + "model.layers.2.self_attn.v_proj.weight": "pytorch_model-00005-of-00082.bin", + "model.layers.20.input_layernorm.weight": "pytorch_model-00043-of-00082.bin", + "model.layers.20.mlp.down_proj.weight": "pytorch_model-00042-of-00082.bin", + "model.layers.20.mlp.gate_proj.weight": "pytorch_model-00042-of-00082.bin", + "model.layers.20.mlp.up_proj.weight": "pytorch_model-00043-of-00082.bin", + "model.layers.20.post_attention_layernorm.weight": "pytorch_model-00043-of-00082.bin", + "model.layers.20.self_attn.k_proj.weight": "pytorch_model-00041-of-00082.bin", + "model.layers.20.self_attn.o_proj.weight": "pytorch_model-00041-of-00082.bin", + "model.layers.20.self_attn.q_proj.weight": "pytorch_model-00041-of-00082.bin", + "model.layers.20.self_attn.rotary_emb.inv_freq": "pytorch_model-00041-of-00082.bin", + "model.layers.20.self_attn.v_proj.weight": "pytorch_model-00041-of-00082.bin", + "model.layers.21.input_layernorm.weight": "pytorch_model-00045-of-00082.bin", + "model.layers.21.mlp.down_proj.weight": "pytorch_model-00044-of-00082.bin", + "model.layers.21.mlp.gate_proj.weight": "pytorch_model-00044-of-00082.bin", + "model.layers.21.mlp.up_proj.weight": "pytorch_model-00045-of-00082.bin", + "model.layers.21.post_attention_layernorm.weight": "pytorch_model-00045-of-00082.bin", + "model.layers.21.self_attn.k_proj.weight": "pytorch_model-00043-of-00082.bin", + "model.layers.21.self_attn.o_proj.weight": "pytorch_model-00043-of-00082.bin", + "model.layers.21.self_attn.q_proj.weight": "pytorch_model-00043-of-00082.bin", + "model.layers.21.self_attn.rotary_emb.inv_freq": "pytorch_model-00043-of-00082.bin", + "model.layers.21.self_attn.v_proj.weight": "pytorch_model-00043-of-00082.bin", + "model.layers.22.input_layernorm.weight": "pytorch_model-00047-of-00082.bin", + "model.layers.22.mlp.down_proj.weight": "pytorch_model-00046-of-00082.bin", + "model.layers.22.mlp.gate_proj.weight": "pytorch_model-00046-of-00082.bin", + "model.layers.22.mlp.up_proj.weight": "pytorch_model-00047-of-00082.bin", + "model.layers.22.post_attention_layernorm.weight": "pytorch_model-00047-of-00082.bin", + "model.layers.22.self_attn.k_proj.weight": "pytorch_model-00045-of-00082.bin", + "model.layers.22.self_attn.o_proj.weight": "pytorch_model-00045-of-00082.bin", + "model.layers.22.self_attn.q_proj.weight": "pytorch_model-00045-of-00082.bin", + "model.layers.22.self_attn.rotary_emb.inv_freq": "pytorch_model-00045-of-00082.bin", + "model.layers.22.self_attn.v_proj.weight": "pytorch_model-00045-of-00082.bin", + "model.layers.23.input_layernorm.weight": "pytorch_model-00049-of-00082.bin", + "model.layers.23.mlp.down_proj.weight": "pytorch_model-00048-of-00082.bin", + "model.layers.23.mlp.gate_proj.weight": "pytorch_model-00048-of-00082.bin", + "model.layers.23.mlp.up_proj.weight": "pytorch_model-00049-of-00082.bin", + "model.layers.23.post_attention_layernorm.weight": "pytorch_model-00049-of-00082.bin", + "model.layers.23.self_attn.k_proj.weight": "pytorch_model-00047-of-00082.bin", + "model.layers.23.self_attn.o_proj.weight": "pytorch_model-00047-of-00082.bin", + "model.layers.23.self_attn.q_proj.weight": "pytorch_model-00047-of-00082.bin", + "model.layers.23.self_attn.rotary_emb.inv_freq": "pytorch_model-00047-of-00082.bin", + "model.layers.23.self_attn.v_proj.weight": "pytorch_model-00047-of-00082.bin", + "model.layers.24.input_layernorm.weight": "pytorch_model-00051-of-00082.bin", + "model.layers.24.mlp.down_proj.weight": "pytorch_model-00050-of-00082.bin", + "model.layers.24.mlp.gate_proj.weight": "pytorch_model-00050-of-00082.bin", + "model.layers.24.mlp.up_proj.weight": "pytorch_model-00051-of-00082.bin", + "model.layers.24.post_attention_layernorm.weight": "pytorch_model-00051-of-00082.bin", + "model.layers.24.self_attn.k_proj.weight": "pytorch_model-00049-of-00082.bin", + "model.layers.24.self_attn.o_proj.weight": "pytorch_model-00049-of-00082.bin", + "model.layers.24.self_attn.q_proj.weight": "pytorch_model-00049-of-00082.bin", + "model.layers.24.self_attn.rotary_emb.inv_freq": "pytorch_model-00049-of-00082.bin", + "model.layers.24.self_attn.v_proj.weight": "pytorch_model-00049-of-00082.bin", + "model.layers.25.input_layernorm.weight": "pytorch_model-00053-of-00082.bin", + "model.layers.25.mlp.down_proj.weight": "pytorch_model-00052-of-00082.bin", + "model.layers.25.mlp.gate_proj.weight": "pytorch_model-00052-of-00082.bin", + "model.layers.25.mlp.up_proj.weight": "pytorch_model-00053-of-00082.bin", + "model.layers.25.post_attention_layernorm.weight": "pytorch_model-00053-of-00082.bin", + "model.layers.25.self_attn.k_proj.weight": "pytorch_model-00051-of-00082.bin", + "model.layers.25.self_attn.o_proj.weight": "pytorch_model-00051-of-00082.bin", + "model.layers.25.self_attn.q_proj.weight": "pytorch_model-00051-of-00082.bin", + "model.layers.25.self_attn.rotary_emb.inv_freq": "pytorch_model-00051-of-00082.bin", + "model.layers.25.self_attn.v_proj.weight": "pytorch_model-00051-of-00082.bin", + "model.layers.26.input_layernorm.weight": "pytorch_model-00055-of-00082.bin", + "model.layers.26.mlp.down_proj.weight": "pytorch_model-00054-of-00082.bin", + "model.layers.26.mlp.gate_proj.weight": "pytorch_model-00054-of-00082.bin", + "model.layers.26.mlp.up_proj.weight": "pytorch_model-00055-of-00082.bin", + "model.layers.26.post_attention_layernorm.weight": "pytorch_model-00055-of-00082.bin", + "model.layers.26.self_attn.k_proj.weight": "pytorch_model-00053-of-00082.bin", + "model.layers.26.self_attn.o_proj.weight": "pytorch_model-00053-of-00082.bin", + "model.layers.26.self_attn.q_proj.weight": "pytorch_model-00053-of-00082.bin", + "model.layers.26.self_attn.rotary_emb.inv_freq": "pytorch_model-00053-of-00082.bin", + "model.layers.26.self_attn.v_proj.weight": "pytorch_model-00053-of-00082.bin", + "model.layers.27.input_layernorm.weight": "pytorch_model-00057-of-00082.bin", + "model.layers.27.mlp.down_proj.weight": "pytorch_model-00056-of-00082.bin", + "model.layers.27.mlp.gate_proj.weight": "pytorch_model-00056-of-00082.bin", + "model.layers.27.mlp.up_proj.weight": "pytorch_model-00057-of-00082.bin", + "model.layers.27.post_attention_layernorm.weight": "pytorch_model-00057-of-00082.bin", + "model.layers.27.self_attn.k_proj.weight": "pytorch_model-00055-of-00082.bin", + "model.layers.27.self_attn.o_proj.weight": "pytorch_model-00055-of-00082.bin", + "model.layers.27.self_attn.q_proj.weight": "pytorch_model-00055-of-00082.bin", + "model.layers.27.self_attn.rotary_emb.inv_freq": "pytorch_model-00055-of-00082.bin", + "model.layers.27.self_attn.v_proj.weight": "pytorch_model-00055-of-00082.bin", + "model.layers.28.input_layernorm.weight": "pytorch_model-00059-of-00082.bin", + "model.layers.28.mlp.down_proj.weight": "pytorch_model-00058-of-00082.bin", + "model.layers.28.mlp.gate_proj.weight": "pytorch_model-00058-of-00082.bin", + "model.layers.28.mlp.up_proj.weight": "pytorch_model-00059-of-00082.bin", + "model.layers.28.post_attention_layernorm.weight": "pytorch_model-00059-of-00082.bin", + "model.layers.28.self_attn.k_proj.weight": "pytorch_model-00057-of-00082.bin", + "model.layers.28.self_attn.o_proj.weight": "pytorch_model-00057-of-00082.bin", + "model.layers.28.self_attn.q_proj.weight": "pytorch_model-00057-of-00082.bin", + "model.layers.28.self_attn.rotary_emb.inv_freq": "pytorch_model-00057-of-00082.bin", + "model.layers.28.self_attn.v_proj.weight": "pytorch_model-00057-of-00082.bin", + "model.layers.29.input_layernorm.weight": "pytorch_model-00061-of-00082.bin", + "model.layers.29.mlp.down_proj.weight": "pytorch_model-00060-of-00082.bin", + "model.layers.29.mlp.gate_proj.weight": "pytorch_model-00060-of-00082.bin", + "model.layers.29.mlp.up_proj.weight": "pytorch_model-00061-of-00082.bin", + "model.layers.29.post_attention_layernorm.weight": "pytorch_model-00061-of-00082.bin", + "model.layers.29.self_attn.k_proj.weight": "pytorch_model-00059-of-00082.bin", + "model.layers.29.self_attn.o_proj.weight": "pytorch_model-00059-of-00082.bin", + "model.layers.29.self_attn.q_proj.weight": "pytorch_model-00059-of-00082.bin", + "model.layers.29.self_attn.rotary_emb.inv_freq": "pytorch_model-00059-of-00082.bin", + "model.layers.29.self_attn.v_proj.weight": "pytorch_model-00059-of-00082.bin", + "model.layers.3.input_layernorm.weight": "pytorch_model-00009-of-00082.bin", + "model.layers.3.mlp.down_proj.weight": "pytorch_model-00008-of-00082.bin", + "model.layers.3.mlp.gate_proj.weight": "pytorch_model-00008-of-00082.bin", + "model.layers.3.mlp.up_proj.weight": "pytorch_model-00009-of-00082.bin", + "model.layers.3.post_attention_layernorm.weight": "pytorch_model-00009-of-00082.bin", + "model.layers.3.self_attn.k_proj.weight": "pytorch_model-00007-of-00082.bin", + "model.layers.3.self_attn.o_proj.weight": "pytorch_model-00007-of-00082.bin", + "model.layers.3.self_attn.q_proj.weight": "pytorch_model-00007-of-00082.bin", + "model.layers.3.self_attn.rotary_emb.inv_freq": "pytorch_model-00007-of-00082.bin", + "model.layers.3.self_attn.v_proj.weight": "pytorch_model-00007-of-00082.bin", + "model.layers.30.input_layernorm.weight": "pytorch_model-00063-of-00082.bin", + "model.layers.30.mlp.down_proj.weight": "pytorch_model-00062-of-00082.bin", + "model.layers.30.mlp.gate_proj.weight": "pytorch_model-00062-of-00082.bin", + "model.layers.30.mlp.up_proj.weight": "pytorch_model-00063-of-00082.bin", + "model.layers.30.post_attention_layernorm.weight": "pytorch_model-00063-of-00082.bin", + "model.layers.30.self_attn.k_proj.weight": "pytorch_model-00061-of-00082.bin", + "model.layers.30.self_attn.o_proj.weight": "pytorch_model-00061-of-00082.bin", + "model.layers.30.self_attn.q_proj.weight": "pytorch_model-00061-of-00082.bin", + "model.layers.30.self_attn.rotary_emb.inv_freq": "pytorch_model-00061-of-00082.bin", + "model.layers.30.self_attn.v_proj.weight": "pytorch_model-00061-of-00082.bin", + "model.layers.31.input_layernorm.weight": "pytorch_model-00065-of-00082.bin", + "model.layers.31.mlp.down_proj.weight": "pytorch_model-00064-of-00082.bin", + "model.layers.31.mlp.gate_proj.weight": "pytorch_model-00064-of-00082.bin", + "model.layers.31.mlp.up_proj.weight": "pytorch_model-00065-of-00082.bin", + "model.layers.31.post_attention_layernorm.weight": "pytorch_model-00065-of-00082.bin", + "model.layers.31.self_attn.k_proj.weight": "pytorch_model-00063-of-00082.bin", + "model.layers.31.self_attn.o_proj.weight": "pytorch_model-00063-of-00082.bin", + "model.layers.31.self_attn.q_proj.weight": "pytorch_model-00063-of-00082.bin", + "model.layers.31.self_attn.rotary_emb.inv_freq": "pytorch_model-00063-of-00082.bin", + "model.layers.31.self_attn.v_proj.weight": "pytorch_model-00063-of-00082.bin", + "model.layers.32.input_layernorm.weight": "pytorch_model-00067-of-00082.bin", + "model.layers.32.mlp.down_proj.weight": "pytorch_model-00066-of-00082.bin", + "model.layers.32.mlp.gate_proj.weight": "pytorch_model-00066-of-00082.bin", + "model.layers.32.mlp.up_proj.weight": "pytorch_model-00067-of-00082.bin", + "model.layers.32.post_attention_layernorm.weight": "pytorch_model-00067-of-00082.bin", + "model.layers.32.self_attn.k_proj.weight": "pytorch_model-00065-of-00082.bin", + "model.layers.32.self_attn.o_proj.weight": "pytorch_model-00065-of-00082.bin", + "model.layers.32.self_attn.q_proj.weight": "pytorch_model-00065-of-00082.bin", + "model.layers.32.self_attn.rotary_emb.inv_freq": "pytorch_model-00065-of-00082.bin", + "model.layers.32.self_attn.v_proj.weight": "pytorch_model-00065-of-00082.bin", + "model.layers.33.input_layernorm.weight": "pytorch_model-00069-of-00082.bin", + "model.layers.33.mlp.down_proj.weight": "pytorch_model-00068-of-00082.bin", + "model.layers.33.mlp.gate_proj.weight": "pytorch_model-00068-of-00082.bin", + "model.layers.33.mlp.up_proj.weight": "pytorch_model-00069-of-00082.bin", + "model.layers.33.post_attention_layernorm.weight": "pytorch_model-00069-of-00082.bin", + "model.layers.33.self_attn.k_proj.weight": "pytorch_model-00067-of-00082.bin", + "model.layers.33.self_attn.o_proj.weight": "pytorch_model-00067-of-00082.bin", + "model.layers.33.self_attn.q_proj.weight": "pytorch_model-00067-of-00082.bin", + "model.layers.33.self_attn.rotary_emb.inv_freq": "pytorch_model-00067-of-00082.bin", + "model.layers.33.self_attn.v_proj.weight": "pytorch_model-00067-of-00082.bin", + "model.layers.34.input_layernorm.weight": "pytorch_model-00071-of-00082.bin", + "model.layers.34.mlp.down_proj.weight": "pytorch_model-00070-of-00082.bin", + "model.layers.34.mlp.gate_proj.weight": "pytorch_model-00070-of-00082.bin", + "model.layers.34.mlp.up_proj.weight": "pytorch_model-00071-of-00082.bin", + "model.layers.34.post_attention_layernorm.weight": "pytorch_model-00071-of-00082.bin", + "model.layers.34.self_attn.k_proj.weight": "pytorch_model-00069-of-00082.bin", + "model.layers.34.self_attn.o_proj.weight": "pytorch_model-00069-of-00082.bin", + "model.layers.34.self_attn.q_proj.weight": "pytorch_model-00069-of-00082.bin", + "model.layers.34.self_attn.rotary_emb.inv_freq": "pytorch_model-00069-of-00082.bin", + "model.layers.34.self_attn.v_proj.weight": "pytorch_model-00069-of-00082.bin", + "model.layers.35.input_layernorm.weight": "pytorch_model-00073-of-00082.bin", + "model.layers.35.mlp.down_proj.weight": "pytorch_model-00072-of-00082.bin", + "model.layers.35.mlp.gate_proj.weight": "pytorch_model-00072-of-00082.bin", + "model.layers.35.mlp.up_proj.weight": "pytorch_model-00073-of-00082.bin", + "model.layers.35.post_attention_layernorm.weight": "pytorch_model-00073-of-00082.bin", + "model.layers.35.self_attn.k_proj.weight": "pytorch_model-00071-of-00082.bin", + "model.layers.35.self_attn.o_proj.weight": "pytorch_model-00071-of-00082.bin", + "model.layers.35.self_attn.q_proj.weight": "pytorch_model-00071-of-00082.bin", + "model.layers.35.self_attn.rotary_emb.inv_freq": "pytorch_model-00071-of-00082.bin", + "model.layers.35.self_attn.v_proj.weight": "pytorch_model-00071-of-00082.bin", + "model.layers.36.input_layernorm.weight": "pytorch_model-00075-of-00082.bin", + "model.layers.36.mlp.down_proj.weight": "pytorch_model-00074-of-00082.bin", + "model.layers.36.mlp.gate_proj.weight": "pytorch_model-00074-of-00082.bin", + "model.layers.36.mlp.up_proj.weight": "pytorch_model-00075-of-00082.bin", + "model.layers.36.post_attention_layernorm.weight": "pytorch_model-00075-of-00082.bin", + "model.layers.36.self_attn.k_proj.weight": "pytorch_model-00073-of-00082.bin", + "model.layers.36.self_attn.o_proj.weight": "pytorch_model-00073-of-00082.bin", + "model.layers.36.self_attn.q_proj.weight": "pytorch_model-00073-of-00082.bin", + "model.layers.36.self_attn.rotary_emb.inv_freq": "pytorch_model-00073-of-00082.bin", + "model.layers.36.self_attn.v_proj.weight": "pytorch_model-00073-of-00082.bin", + "model.layers.37.input_layernorm.weight": "pytorch_model-00077-of-00082.bin", + "model.layers.37.mlp.down_proj.weight": "pytorch_model-00076-of-00082.bin", + "model.layers.37.mlp.gate_proj.weight": "pytorch_model-00076-of-00082.bin", + "model.layers.37.mlp.up_proj.weight": "pytorch_model-00077-of-00082.bin", + "model.layers.37.post_attention_layernorm.weight": "pytorch_model-00077-of-00082.bin", + "model.layers.37.self_attn.k_proj.weight": "pytorch_model-00075-of-00082.bin", + "model.layers.37.self_attn.o_proj.weight": "pytorch_model-00075-of-00082.bin", + "model.layers.37.self_attn.q_proj.weight": "pytorch_model-00075-of-00082.bin", + "model.layers.37.self_attn.rotary_emb.inv_freq": "pytorch_model-00075-of-00082.bin", + "model.layers.37.self_attn.v_proj.weight": "pytorch_model-00075-of-00082.bin", + "model.layers.38.input_layernorm.weight": "pytorch_model-00079-of-00082.bin", + "model.layers.38.mlp.down_proj.weight": "pytorch_model-00078-of-00082.bin", + "model.layers.38.mlp.gate_proj.weight": "pytorch_model-00078-of-00082.bin", + "model.layers.38.mlp.up_proj.weight": "pytorch_model-00079-of-00082.bin", + "model.layers.38.post_attention_layernorm.weight": "pytorch_model-00079-of-00082.bin", + "model.layers.38.self_attn.k_proj.weight": "pytorch_model-00077-of-00082.bin", + "model.layers.38.self_attn.o_proj.weight": "pytorch_model-00077-of-00082.bin", + "model.layers.38.self_attn.q_proj.weight": "pytorch_model-00077-of-00082.bin", + "model.layers.38.self_attn.rotary_emb.inv_freq": "pytorch_model-00077-of-00082.bin", + "model.layers.38.self_attn.v_proj.weight": "pytorch_model-00077-of-00082.bin", + "model.layers.39.input_layernorm.weight": "pytorch_model-00081-of-00082.bin", + "model.layers.39.mlp.down_proj.weight": "pytorch_model-00080-of-00082.bin", + "model.layers.39.mlp.gate_proj.weight": "pytorch_model-00080-of-00082.bin", + "model.layers.39.mlp.up_proj.weight": "pytorch_model-00081-of-00082.bin", + "model.layers.39.post_attention_layernorm.weight": "pytorch_model-00081-of-00082.bin", + "model.layers.39.self_attn.k_proj.weight": "pytorch_model-00079-of-00082.bin", + "model.layers.39.self_attn.o_proj.weight": "pytorch_model-00079-of-00082.bin", + "model.layers.39.self_attn.q_proj.weight": "pytorch_model-00079-of-00082.bin", + "model.layers.39.self_attn.rotary_emb.inv_freq": "pytorch_model-00079-of-00082.bin", + "model.layers.39.self_attn.v_proj.weight": "pytorch_model-00079-of-00082.bin", + "model.layers.4.input_layernorm.weight": "pytorch_model-00011-of-00082.bin", + "model.layers.4.mlp.down_proj.weight": "pytorch_model-00010-of-00082.bin", + "model.layers.4.mlp.gate_proj.weight": "pytorch_model-00010-of-00082.bin", + "model.layers.4.mlp.up_proj.weight": "pytorch_model-00011-of-00082.bin", + "model.layers.4.post_attention_layernorm.weight": "pytorch_model-00011-of-00082.bin", + "model.layers.4.self_attn.k_proj.weight": "pytorch_model-00009-of-00082.bin", + "model.layers.4.self_attn.o_proj.weight": "pytorch_model-00009-of-00082.bin", + "model.layers.4.self_attn.q_proj.weight": "pytorch_model-00009-of-00082.bin", + "model.layers.4.self_attn.rotary_emb.inv_freq": "pytorch_model-00009-of-00082.bin", + "model.layers.4.self_attn.v_proj.weight": "pytorch_model-00009-of-00082.bin", + "model.layers.5.input_layernorm.weight": "pytorch_model-00013-of-00082.bin", + "model.layers.5.mlp.down_proj.weight": "pytorch_model-00012-of-00082.bin", + "model.layers.5.mlp.gate_proj.weight": "pytorch_model-00012-of-00082.bin", + "model.layers.5.mlp.up_proj.weight": "pytorch_model-00013-of-00082.bin", + "model.layers.5.post_attention_layernorm.weight": "pytorch_model-00013-of-00082.bin", + "model.layers.5.self_attn.k_proj.weight": "pytorch_model-00011-of-00082.bin", + "model.layers.5.self_attn.o_proj.weight": "pytorch_model-00011-of-00082.bin", + "model.layers.5.self_attn.q_proj.weight": "pytorch_model-00011-of-00082.bin", + "model.layers.5.self_attn.rotary_emb.inv_freq": "pytorch_model-00011-of-00082.bin", + "model.layers.5.self_attn.v_proj.weight": "pytorch_model-00011-of-00082.bin", + "model.layers.6.input_layernorm.weight": "pytorch_model-00015-of-00082.bin", + "model.layers.6.mlp.down_proj.weight": "pytorch_model-00014-of-00082.bin", + "model.layers.6.mlp.gate_proj.weight": "pytorch_model-00014-of-00082.bin", + "model.layers.6.mlp.up_proj.weight": "pytorch_model-00015-of-00082.bin", + "model.layers.6.post_attention_layernorm.weight": "pytorch_model-00015-of-00082.bin", + "model.layers.6.self_attn.k_proj.weight": "pytorch_model-00013-of-00082.bin", + "model.layers.6.self_attn.o_proj.weight": "pytorch_model-00013-of-00082.bin", + "model.layers.6.self_attn.q_proj.weight": "pytorch_model-00013-of-00082.bin", + "model.layers.6.self_attn.rotary_emb.inv_freq": "pytorch_model-00013-of-00082.bin", + "model.layers.6.self_attn.v_proj.weight": "pytorch_model-00013-of-00082.bin", + "model.layers.7.input_layernorm.weight": "pytorch_model-00017-of-00082.bin", + "model.layers.7.mlp.down_proj.weight": "pytorch_model-00016-of-00082.bin", + "model.layers.7.mlp.gate_proj.weight": "pytorch_model-00016-of-00082.bin", + "model.layers.7.mlp.up_proj.weight": "pytorch_model-00017-of-00082.bin", + "model.layers.7.post_attention_layernorm.weight": "pytorch_model-00017-of-00082.bin", + "model.layers.7.self_attn.k_proj.weight": "pytorch_model-00015-of-00082.bin", + "model.layers.7.self_attn.o_proj.weight": "pytorch_model-00015-of-00082.bin", + "model.layers.7.self_attn.q_proj.weight": "pytorch_model-00015-of-00082.bin", + "model.layers.7.self_attn.rotary_emb.inv_freq": "pytorch_model-00015-of-00082.bin", + "model.layers.7.self_attn.v_proj.weight": "pytorch_model-00015-of-00082.bin", + "model.layers.8.input_layernorm.weight": "pytorch_model-00019-of-00082.bin", + "model.layers.8.mlp.down_proj.weight": "pytorch_model-00018-of-00082.bin", + "model.layers.8.mlp.gate_proj.weight": "pytorch_model-00018-of-00082.bin", + "model.layers.8.mlp.up_proj.weight": "pytorch_model-00019-of-00082.bin", + "model.layers.8.post_attention_layernorm.weight": "pytorch_model-00019-of-00082.bin", + "model.layers.8.self_attn.k_proj.weight": "pytorch_model-00017-of-00082.bin", + "model.layers.8.self_attn.o_proj.weight": "pytorch_model-00017-of-00082.bin", + "model.layers.8.self_attn.q_proj.weight": "pytorch_model-00017-of-00082.bin", + "model.layers.8.self_attn.rotary_emb.inv_freq": "pytorch_model-00017-of-00082.bin", + "model.layers.8.self_attn.v_proj.weight": "pytorch_model-00017-of-00082.bin", + "model.layers.9.input_layernorm.weight": "pytorch_model-00021-of-00082.bin", + "model.layers.9.mlp.down_proj.weight": "pytorch_model-00020-of-00082.bin", + "model.layers.9.mlp.gate_proj.weight": "pytorch_model-00020-of-00082.bin", + "model.layers.9.mlp.up_proj.weight": "pytorch_model-00021-of-00082.bin", + "model.layers.9.post_attention_layernorm.weight": "pytorch_model-00021-of-00082.bin", + "model.layers.9.self_attn.k_proj.weight": "pytorch_model-00019-of-00082.bin", + "model.layers.9.self_attn.o_proj.weight": "pytorch_model-00019-of-00082.bin", + "model.layers.9.self_attn.q_proj.weight": "pytorch_model-00019-of-00082.bin", + "model.layers.9.self_attn.rotary_emb.inv_freq": "pytorch_model-00019-of-00082.bin", + "model.layers.9.self_attn.v_proj.weight": "pytorch_model-00019-of-00082.bin", + "model.norm.weight": "pytorch_model-00081-of-00082.bin" + } +}