diff --git a/config.json b/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2f548d0957475f529cd632501d1ebdf1813bafae --- /dev/null +++ b/config.json @@ -0,0 +1,23 @@ +{ + "_name_or_path": "decapoda-research/llama-13b-hf", + "architectures": [ + "LlamaForCausalLM" + ], + "bos_token_id": 0, + "eos_token_id": 1, + "hidden_act": "silu", + "hidden_size": 5120, + "initializer_range": 0.02, + "intermediate_size": 13824, + "max_sequence_length": 2048, + "model_type": "llama", + "num_attention_heads": 40, + "num_hidden_layers": 40, + "pad_token_id": -1, + "rms_norm_eps": 1e-06, + "tie_word_embeddings": false, + "torch_dtype": "float16", + "transformers_version": "4.28.0.dev0", + "use_cache": true, + "vocab_size": 32000 +} diff --git a/generation_config.json b/generation_config.json new file mode 100644 index 0000000000000000000000000000000000000000..128b48946713166edcc3e3c62ae5fe285df776be --- /dev/null +++ b/generation_config.json @@ -0,0 +1,7 @@ +{ + "_from_model_config": true, + "bos_token_id": 0, + "eos_token_id": 1, + "pad_token_id": 0, + "transformers_version": "4.28.0.dev0" +} diff --git a/pytorch_model-00001-of-00082.bin b/pytorch_model-00001-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..e7e93e18e7367f8e68243bf64b39b83098a571eb --- /dev/null +++ b/pytorch_model-00001-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e07c7ba895f89e1af14a5e66a58458abc78d94fc91ca394edb530d1d3f247f0b +size 380110075 diff --git a/pytorch_model-00002-of-00082.bin b/pytorch_model-00002-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..4cc4e0a818ec5f6e51a543cd0ed44a6cb6daffc2 --- /dev/null +++ b/pytorch_model-00002-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b0aee32ee10e3b318e270462f57e114cf076029fe4c9edaa005ff0ac1a8c6e7 +size 298846638 diff --git a/pytorch_model-00003-of-00082.bin b/pytorch_model-00003-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..d2f59b3c4d8d4ca7cfcc21221c2459d6b0715462 --- /dev/null +++ b/pytorch_model-00003-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa9413cba6cbd37791ff41162a1983b267e0b01444c1570dd31293e983237e34 +size 705190126 diff --git a/pytorch_model-00004-of-00082.bin b/pytorch_model-00004-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..ac6d8cad36b64e498c8f4c0abfface69315af7db --- /dev/null +++ b/pytorch_model-00004-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e56f6d0e73f87777167c6d267f8cc78aefda0e1ee086a185ff943a3d95aaedc8 +size 387975598 diff --git a/pytorch_model-00005-of-00082.bin b/pytorch_model-00005-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..f63c543679ef775349697ed996c19bdbe20ed15a --- /dev/null +++ b/pytorch_model-00005-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9080d2f8e3a57234df54b969dae0ddf6557f3d4a3d75cff9fc6e14fdec30923b +size 668490896 diff --git a/pytorch_model-00006-of-00082.bin b/pytorch_model-00006-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..357a8e07dc9f069a793a4cb5c772dc927222dd27 --- /dev/null +++ b/pytorch_model-00006-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cc1c552640ca98eb953174f314be35003e7d0a83cd66876dfc2503213d47599 +size 283116795 diff --git a/pytorch_model-00007-of-00082.bin b/pytorch_model-00007-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..1b61c5081cf3138cac1eb6a82944e89f0cc2414f --- /dev/null +++ b/pytorch_model-00007-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a17aa23bc9e5fe3ac6fecc20998d7677d22824bd8a3db787d229aeb885a6c653 +size 668490896 diff --git a/pytorch_model-00008-of-00082.bin b/pytorch_model-00008-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..8677493c4cd36c57b2e669f2567150c869840cbc --- /dev/null +++ b/pytorch_model-00008-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d80edfca8890f5fa22322cd6a7a074cf8ac967766693d97adc3169ea734ad75 +size 283116795 diff --git a/pytorch_model-00009-of-00082.bin b/pytorch_model-00009-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..70e4cad9f23314095909af2a6e9376066354344e --- /dev/null +++ b/pytorch_model-00009-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cc50610ce0927a2dc7392c5320a8d734103779b9dd717c1327dd00f7369fd1b +size 668490896 diff --git a/pytorch_model-00010-of-00082.bin b/pytorch_model-00010-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..d03ddd77c776a7649998f759a802c0e1288c0282 --- /dev/null +++ b/pytorch_model-00010-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92e29f91a92127ef330e71f0f664b8d3ada8526427ed6ef8a85efd6a668b8f60 +size 283116795 diff --git a/pytorch_model-00011-of-00082.bin b/pytorch_model-00011-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..7cdc7122c0b50128edf4a7541e5d5944cfc81fae --- /dev/null +++ b/pytorch_model-00011-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f029c25a7fffa560b77c5194c958bfb41b9ef0f6000e829e24e9b2411c89370 +size 668490896 diff --git a/pytorch_model-00012-of-00082.bin b/pytorch_model-00012-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..7dc44cc388c43ef7552244a052ad564c31739a0a --- /dev/null +++ b/pytorch_model-00012-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26136f021a572bc5545c45366793f328b27ba7a817169e882ee43512ed920986 +size 283116795 diff --git a/pytorch_model-00013-of-00082.bin b/pytorch_model-00013-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..c2b0c3faf38eea84647a4c144d2830c5d196a06c --- /dev/null +++ b/pytorch_model-00013-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:305c31b190878f8c88539442ad6c61d5a97f765a77d3e989595cbaee1d26b353 +size 668490896 diff --git a/pytorch_model-00014-of-00082.bin b/pytorch_model-00014-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..f76074b851a2e0adb596955f2cebbf4624d6d176 --- /dev/null +++ b/pytorch_model-00014-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad550ac7984955710c3aef53b3cf44b675736373cced6bdde2c10bd90fd05e00 +size 283116795 diff --git a/pytorch_model-00015-of-00082.bin b/pytorch_model-00015-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..802f92eb7613a6a91a7ad9fd427da15bb009872f --- /dev/null +++ b/pytorch_model-00015-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d846556ebc70813d7142e10bb724c26456fa723e399de232e81e3d41bff393a9 +size 668490896 diff --git a/pytorch_model-00016-of-00082.bin b/pytorch_model-00016-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..10ee4d4ffbd2be738c61b5d2955e77e90b648284 --- /dev/null +++ b/pytorch_model-00016-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8291046bbb599b31c293ce23e3174a87834c97e765d37aff394a8227c120ffcb +size 283116795 diff --git a/pytorch_model-00017-of-00082.bin b/pytorch_model-00017-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..cad478617893e8e7f2552ba4b6bc1c5db21fdfe6 --- /dev/null +++ b/pytorch_model-00017-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d8e35af4ee5aac0fea17a2ffe1d9ac78186ecf09a89251bea0558e48cf265be +size 668490896 diff --git a/pytorch_model-00018-of-00082.bin b/pytorch_model-00018-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..7e6e67161e363674e5933b9ebc814b107e6e76d1 --- /dev/null +++ b/pytorch_model-00018-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e25c2a779547ff1bfea36dd16d6ce68844d784c3594f502aa8279723fbb54bfc +size 283116795 diff --git a/pytorch_model-00019-of-00082.bin b/pytorch_model-00019-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..98487b0ba0bb6eae13364ad98bf9e21ba6e8c3c0 --- /dev/null +++ b/pytorch_model-00019-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19ad505aec78f502e8cec3868bede5151dfa32e7ca676b757d8efcbe62d71511 +size 668490896 diff --git a/pytorch_model-00020-of-00082.bin b/pytorch_model-00020-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..edfb3fbb39b468301570d6f86d87706d92294cd7 --- /dev/null +++ b/pytorch_model-00020-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcf8ba21239f070b3dddf08b428a032ec1a0f0b97adf91d614db67685b8a2f3c +size 283116795 diff --git a/pytorch_model-00021-of-00082.bin b/pytorch_model-00021-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..f27526eb21e9231b764e7b978b46cfa6095995c1 --- /dev/null +++ b/pytorch_model-00021-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3abb4a5de6a8f0e3aceab0993992d39dc6ae72a0bc99a97aece8944de8963bb2 +size 668490896 diff --git a/pytorch_model-00022-of-00082.bin b/pytorch_model-00022-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..08e30781089efed1fc42331db4943b7eec37c22d --- /dev/null +++ b/pytorch_model-00022-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c538c86a2cb6f36a03ee39afeb1fbd580c169b6d25b27108e3a6539b68cd8f1 +size 283116795 diff --git a/pytorch_model-00023-of-00082.bin b/pytorch_model-00023-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..24f0266186084481b3c2fc6c3cf67389b6462760 --- /dev/null +++ b/pytorch_model-00023-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba1efee51bf3ca8a59d2fbd442f31a66bf7e46c3820d167b4a3f5e7bdf3f6ca9 +size 668490896 diff --git a/pytorch_model-00024-of-00082.bin b/pytorch_model-00024-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..ad36a39e79b2883251924da5f297a8870441a325 --- /dev/null +++ b/pytorch_model-00024-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6591f1b2560ba2159919148ccd3d14edc04503f2d006ed1b15b57c57f626e9e9 +size 283116795 diff --git a/pytorch_model-00025-of-00082.bin b/pytorch_model-00025-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..dfae9f829be3a13d9d773025e55c9d18d5f2c657 --- /dev/null +++ b/pytorch_model-00025-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e390b2c9c7de5d46ca23e3b9a38a2ce9c2ad1bc34f021d3deb107e777dc4bdaa +size 668490896 diff --git a/pytorch_model-00026-of-00082.bin b/pytorch_model-00026-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..4b1d3ef696bb24a46397b4b177c482422026f37b --- /dev/null +++ b/pytorch_model-00026-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76eee6652908ce206baf7357d9f5d8ad301a8f8d79428aec99ef7dec3b32e646 +size 283116795 diff --git a/pytorch_model-00027-of-00082.bin b/pytorch_model-00027-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..36b47489dfef19115ed430b337628230405721e9 --- /dev/null +++ b/pytorch_model-00027-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7eb693a643d231df7dfffeefb28dc554ac2116754db509df383d2ca20e72999a +size 668490896 diff --git a/pytorch_model-00028-of-00082.bin b/pytorch_model-00028-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..8bc06c4502866ee765ff1742345d92fd8a518579 --- /dev/null +++ b/pytorch_model-00028-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4242a2a58ee759158f020d7164b669b278a82c23eba7c40ba9e25068c2b91ce +size 283116795 diff --git a/pytorch_model-00029-of-00082.bin b/pytorch_model-00029-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..7d745d8d178a5cd01b3903c555a192b0885c158d --- /dev/null +++ b/pytorch_model-00029-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57e104b23f61b46920282a8c8f7e2a44becd57d4a2925fa1d49b22aedcd52e38 +size 668490896 diff --git a/pytorch_model-00030-of-00082.bin b/pytorch_model-00030-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..008b4aa2912bc378c15b46bafc75976237f22116 --- /dev/null +++ b/pytorch_model-00030-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e1dc8c99a219094b4464fa6c4e7d16de5851ed53b1a94444c6f8045a5ebef9a +size 283116795 diff --git a/pytorch_model-00031-of-00082.bin b/pytorch_model-00031-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..3148b88eb4865cdc3315251f474e9d2255681db8 --- /dev/null +++ b/pytorch_model-00031-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04154c1fc8803ffa8fad8fb8869ce9ac92d240e9ea8a0a307adc554d8b0b5790 +size 668490896 diff --git a/pytorch_model-00032-of-00082.bin b/pytorch_model-00032-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..fa184fc30de69e72b83ada5d64de91de9c5af5ee --- /dev/null +++ b/pytorch_model-00032-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d21051227d43ddb58ae705034715939d70ada16a19c8d009003779174b62ad7 +size 283116795 diff --git a/pytorch_model-00033-of-00082.bin b/pytorch_model-00033-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..18fddb2488e9713adc31eae0de6569734b80d8ef --- /dev/null +++ b/pytorch_model-00033-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84c8891f1cd9a7f56b0d5eed8bbabbcdf6eb04b85f9b634ad62f8703e8a45180 +size 668490896 diff --git a/pytorch_model-00034-of-00082.bin b/pytorch_model-00034-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..2391de0b4b48b010c30b76ecf93517c2ae2c19d2 --- /dev/null +++ b/pytorch_model-00034-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d881ebfef6c0f21c05c8d19a58dee4715b720f7448041aebd37c95c34d440eda +size 283116795 diff --git a/pytorch_model-00035-of-00082.bin b/pytorch_model-00035-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..a80fd067ec2e7dab70020d6b190422dcf2180440 --- /dev/null +++ b/pytorch_model-00035-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1e98ecf1ee97a200339c26df2e0e8d7c6ce8ede01ddffde3c6e6bd216595fc8 +size 668490896 diff --git a/pytorch_model-00036-of-00082.bin b/pytorch_model-00036-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..323cf0ebb49aac5ce575a1c29f8cbc05c7a2afc9 --- /dev/null +++ b/pytorch_model-00036-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d315936eb49804cd38444850a42a62b6f1190b55fff13d9a8ebd79abe0043045 +size 283116795 diff --git a/pytorch_model-00037-of-00082.bin b/pytorch_model-00037-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..0678b0b0023ad122cb89e075dceb5674f4fe1bb3 --- /dev/null +++ b/pytorch_model-00037-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95cd533cab82853ab893ace20b7779969741d98725b8d86a84e3e547a78b652f +size 668490896 diff --git a/pytorch_model-00038-of-00082.bin b/pytorch_model-00038-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..0cc5eeb7a99c0672ca99496e44cebbfa40d42b80 --- /dev/null +++ b/pytorch_model-00038-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a48a714ba461c060ef66cd735cf8096b1b097365e9538bde4369250c1f36d044 +size 283116795 diff --git a/pytorch_model-00039-of-00082.bin b/pytorch_model-00039-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..24ed10f593c3bc8b2ed589f579419ab719287c60 --- /dev/null +++ b/pytorch_model-00039-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85e80a568f6b01170d07360204a9cefe021b321ceb23eb729eaf0d7a468a4665 +size 668490896 diff --git a/pytorch_model-00040-of-00082.bin b/pytorch_model-00040-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..cde7a16ff10c2ef84dd3c07da31bf4ab1b69adc1 --- /dev/null +++ b/pytorch_model-00040-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b776517d136e5f14cb85f31e02a4c63e460d3e2eec62008e7de6ea236825ff51 +size 283116795 diff --git a/pytorch_model-00041-of-00082.bin b/pytorch_model-00041-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..f69b14f036be19622c6833266429f32ead7e1431 --- /dev/null +++ b/pytorch_model-00041-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90e1a00528c0a52e2a715ca9722d733bc3a5f5d3c1e904b6f1ad6b3cf1e44fcd +size 668490896 diff --git a/pytorch_model-00042-of-00082.bin b/pytorch_model-00042-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..f0a47275068a00ee3447a45ec987f23e22a8e0ca --- /dev/null +++ b/pytorch_model-00042-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b63fe9b47295b20f5c5a60bb36f5a6f6e314ebe57e34a4c430b0da3092179aa4 +size 283116795 diff --git a/pytorch_model-00043-of-00082.bin b/pytorch_model-00043-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..6f7e3c075b0493903037941ddcf4ac7d80fb3ad8 --- /dev/null +++ b/pytorch_model-00043-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1151d9ae83904e7c5f82da3191fe3ab1d2319fbeeace7a4804ea76224acbb75b +size 668490896 diff --git a/pytorch_model-00044-of-00082.bin b/pytorch_model-00044-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..7a20536dbe8a13b0031d74d8b520d1e863757bfe --- /dev/null +++ b/pytorch_model-00044-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f490f7529120107a27b4967fc45616554d7690ebfef90340bd78afe4f3dfc9c4 +size 283116795 diff --git a/pytorch_model-00045-of-00082.bin b/pytorch_model-00045-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..96293452c13c4a934a9d73c6a419e2cfe698aed8 --- /dev/null +++ b/pytorch_model-00045-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e6bb639437f38a344080213ace87b5d8bf605a661d80f2060aa596a5ac79af2 +size 668490896 diff --git a/pytorch_model-00046-of-00082.bin b/pytorch_model-00046-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..2661ad2b5e66b355dfbaaf0c7a190a792f3fb893 --- /dev/null +++ b/pytorch_model-00046-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:963c52db583c853a94492302ed24175739788a8e506e8f6e10967d1c98fe49e7 +size 283116795 diff --git a/pytorch_model-00047-of-00082.bin b/pytorch_model-00047-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..972756ea660a755cccbcbb8ccdb78dc776f43d2d --- /dev/null +++ b/pytorch_model-00047-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:828f9db62af4ba9213dbb45c1d58eb05882084100d9ba95f976a0a4e5efafb0e +size 668490896 diff --git a/pytorch_model-00048-of-00082.bin b/pytorch_model-00048-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..1ebd44f8ab95a2a870c893359c9e2fdb6bb78be2 --- /dev/null +++ b/pytorch_model-00048-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e65b070c829a8a340fc527208e4a86642cbb4bce46c2df9dd3ad2b7dcede1a8 +size 283116795 diff --git a/pytorch_model-00049-of-00082.bin b/pytorch_model-00049-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..a00b0757c22540f81160ba11f9b7fc388fd7c360 --- /dev/null +++ b/pytorch_model-00049-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82f33c0cb2f375a30e1ea14e7bcd0bae55b144d35ba052d33bbc0a0ee2425312 +size 668490896 diff --git a/pytorch_model-00050-of-00082.bin b/pytorch_model-00050-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..97c0d1b131331958d76d9cf7a06be78d215fa839 --- /dev/null +++ b/pytorch_model-00050-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a450672e6cbd1662afd63d5df8fdc8403b756660924981293a5b8914b1a0098 +size 283116795 diff --git a/pytorch_model-00051-of-00082.bin b/pytorch_model-00051-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..2737f0a72a66e3a8b2af04e0f7750cccef722750 --- /dev/null +++ b/pytorch_model-00051-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d35b8dff552180789996449c00a9d88cc07e863bfc53ee5ec361ac92dd2b063 +size 668490896 diff --git a/pytorch_model-00052-of-00082.bin b/pytorch_model-00052-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..68503a1007d7bc2cdc1eaddb559d4f9140e2f661 --- /dev/null +++ b/pytorch_model-00052-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c37f281c2089e5df89852267702e03082654361db15e14eeb499d3f4d0ba641c +size 283116795 diff --git a/pytorch_model-00053-of-00082.bin b/pytorch_model-00053-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..da91ed7feb97b9c9687991ba214c597870e8e055 --- /dev/null +++ b/pytorch_model-00053-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f72e6cfc2288d51763dbbc02cfd1ddb627e30cf077ea1af9743c2b325cd5103d +size 668490896 diff --git a/pytorch_model-00054-of-00082.bin b/pytorch_model-00054-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..d7e6272daa4ee027c0d50beb3ab31ed1ac31b92a --- /dev/null +++ b/pytorch_model-00054-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea497fd39a273ef3548d639029ee5dac5369c9234313ab5adb807e652c7ea88e +size 283116795 diff --git a/pytorch_model-00055-of-00082.bin b/pytorch_model-00055-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..b1537e2107430dccc6406d4a1948e592b824e2b2 --- /dev/null +++ b/pytorch_model-00055-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e12d353c157f27fffec3d8b3b101ef7a44c43189cbef4e082d95bebcefa62fc +size 668490896 diff --git a/pytorch_model-00056-of-00082.bin b/pytorch_model-00056-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..292db6b253b2b8e1575cb6fc6902623ebbba8de7 --- /dev/null +++ b/pytorch_model-00056-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3516e224b00db94be2369cdb79a26252ef59d1035f882494f8eee3a7430803b +size 283116795 diff --git a/pytorch_model-00057-of-00082.bin b/pytorch_model-00057-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..b798f27a1a3a645613a82d41f9a221eaa4d17117 --- /dev/null +++ b/pytorch_model-00057-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9778e7087c0413866a1f4a450c9901db13e1d08bab246cc7d2afc5ab53ca5c95 +size 668490896 diff --git a/pytorch_model-00058-of-00082.bin b/pytorch_model-00058-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..634d5bbbc3480dc3d63d78049f1bd60805f29aa1 --- /dev/null +++ b/pytorch_model-00058-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e0eaef3c37133f5398f5037e8ad0de1590cdd150ac27d5232187f513ff716be +size 283116795 diff --git a/pytorch_model-00059-of-00082.bin b/pytorch_model-00059-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..392017bb30558ab8b7b869bbf542b58ba689c038 --- /dev/null +++ b/pytorch_model-00059-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae1c3bfcac457511fa10e5b362127f21061c7bb1a1542f5a7c3de3a4ba77964a +size 668490896 diff --git a/pytorch_model-00060-of-00082.bin b/pytorch_model-00060-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..59041dae0c8794cd217762dd2fa672cbb700e30b --- /dev/null +++ b/pytorch_model-00060-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cb609dbcf9246c840aad81709f99a941c91a996761770326f6827a2666649f6 +size 283116795 diff --git a/pytorch_model-00061-of-00082.bin b/pytorch_model-00061-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..be505821160684dc60853b8b86efec0788d6e93e --- /dev/null +++ b/pytorch_model-00061-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61068aaca587f04a3a05baf589c4a2681743667397219bbbf4003139c6677ebe +size 668490896 diff --git a/pytorch_model-00062-of-00082.bin b/pytorch_model-00062-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..bcd374814524160180a4d69e7bbbdb981e575aad --- /dev/null +++ b/pytorch_model-00062-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab2404d8f80ec7c0a34d0a68c89ab7921bcfe3822ec0b3fcda57e46708ab6982 +size 283116795 diff --git a/pytorch_model-00063-of-00082.bin b/pytorch_model-00063-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..314d9e63021b9e8b5675f1fea1e8505a80dfd457 --- /dev/null +++ b/pytorch_model-00063-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a07f3f53052367898b15b0ee4426eb93fe8db7c3856f265fbc6fbb210d35c9ee +size 668490896 diff --git a/pytorch_model-00064-of-00082.bin b/pytorch_model-00064-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..9c6b7c399419d69ead21bc3c805991b13119323b --- /dev/null +++ b/pytorch_model-00064-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd16b03bb7c34197619ac71bce209ef1eba87748168a19894b222b6f0ca837de +size 283116795 diff --git a/pytorch_model-00065-of-00082.bin b/pytorch_model-00065-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..39ddb7f38fa5a36560cea1a8f51fbfa011240865 --- /dev/null +++ b/pytorch_model-00065-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a7a47d0d38143f32124d9a3fd7c3501a756002878969bc1d9d0dada3393ecaa +size 668490896 diff --git a/pytorch_model-00066-of-00082.bin b/pytorch_model-00066-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..07f3512e6a4e8b6303618fb87983df0edff6d96e --- /dev/null +++ b/pytorch_model-00066-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:287b0055cd6c213d5537d297f39dee8238a9ac75e90c4ae2cd150b48b01eae37 +size 283116795 diff --git a/pytorch_model-00067-of-00082.bin b/pytorch_model-00067-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..cacf90023cbeebadc600fb71a04285131c4da768 --- /dev/null +++ b/pytorch_model-00067-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16252cf921118d6687f3d52a8d9d966cc5e98bff42eb8ebc0e081e3c7406daf0 +size 668490896 diff --git a/pytorch_model-00068-of-00082.bin b/pytorch_model-00068-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..4e6ab793c98eb3cdb7b7c37d255258b999fd5b66 --- /dev/null +++ b/pytorch_model-00068-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8133dff37c97e3c787b596afcfee9187ccc4f98fc6a049f6ade30667ef0c5dc9 +size 283116795 diff --git a/pytorch_model-00069-of-00082.bin b/pytorch_model-00069-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..5d674cc6ae0152319fd8d8549cbe0c42906a6521 --- /dev/null +++ b/pytorch_model-00069-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70eedc51661d476ace01d6ad3b799ee786a2f268ad8e3155a7f990e6c817b30c +size 668490896 diff --git a/pytorch_model-00070-of-00082.bin b/pytorch_model-00070-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..b9464b16867821776bb0b78fdc11c1e3e8608e39 --- /dev/null +++ b/pytorch_model-00070-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10f09b9e414918496844673f7028e3be069fd2224d3f15c42b6390399ab9013b +size 283116795 diff --git a/pytorch_model-00071-of-00082.bin b/pytorch_model-00071-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..1f6ba7d8699d421cdfd38f643b1c18be8def0404 --- /dev/null +++ b/pytorch_model-00071-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:745b5dee85bf294cec15a9c8ec5ba085e0532f47a4c54f18f489b6e033445a97 +size 668490896 diff --git a/pytorch_model-00072-of-00082.bin b/pytorch_model-00072-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..7e5d3eb6ca30f1d22751da7b86eb652c8fc448cb --- /dev/null +++ b/pytorch_model-00072-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87b432946a6195b4f93f0c0c3045f38541c6254e782098bef4cda8c1387989b1 +size 283116795 diff --git a/pytorch_model-00073-of-00082.bin b/pytorch_model-00073-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..b8af4a4cb579b513acba27a27a5501c817ec1cd5 --- /dev/null +++ b/pytorch_model-00073-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e14d781c7f8fa7714d55813ac05f68a801ca0428f8d576750d76f82b5cb4a9e +size 668490896 diff --git a/pytorch_model-00074-of-00082.bin b/pytorch_model-00074-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..b8f73ce9cdd14464e71ad4f6e1392cde8debd202 --- /dev/null +++ b/pytorch_model-00074-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:224ea5ebc9d1868d5f40ca08d85c4070542d4be11b3d638893d3e6a9aeeac402 +size 283116795 diff --git a/pytorch_model-00075-of-00082.bin b/pytorch_model-00075-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..2df1d565f246dc3e049fd68712e4bfc8fe626072 --- /dev/null +++ b/pytorch_model-00075-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6321d3b5cfc03bee9e706d10a2f33ed58dd27223fe25b30573475ffd1d1ee209 +size 668490896 diff --git a/pytorch_model-00076-of-00082.bin b/pytorch_model-00076-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..976473a25e230e342101b10d577567e06ffb5f38 --- /dev/null +++ b/pytorch_model-00076-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9355f4cdef3c2e54f8da6b5afe4bc229be89492f6a4ea5edeecaadc32441f7c5 +size 283116795 diff --git a/pytorch_model-00077-of-00082.bin b/pytorch_model-00077-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..91a5b138f5a1e2266e4877fc74c7bf53579c926b --- /dev/null +++ b/pytorch_model-00077-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46e4d75362ef7a78d64c51df7b7a7276b0b7a02641cce7091f2b390373bd1c94 +size 668490896 diff --git a/pytorch_model-00078-of-00082.bin b/pytorch_model-00078-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..f8434c1b4df43d646559b7131693a8e943c6c4a2 --- /dev/null +++ b/pytorch_model-00078-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd6e8e8a506ac480b7663483317f9562fdb5b8ffcda6c4442927b40fe614d9bd +size 283116795 diff --git a/pytorch_model-00079-of-00082.bin b/pytorch_model-00079-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..f4c87ecedca3923d8b308cfd4f9cbd7154b1d069 --- /dev/null +++ b/pytorch_model-00079-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d55d7f0f266fd46923ed5b66c8bbc57a4a2d0e0a75c972caa26270f7c6f8577c +size 668490896 diff --git a/pytorch_model-00080-of-00082.bin b/pytorch_model-00080-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..fedf94e52ef9bb07e67d0abee14db0b30ab7c86e --- /dev/null +++ b/pytorch_model-00080-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:153c78065e32366f6aaabb34f329a70bbbd6ae0cd668076f6d60230666852a54 +size 283116795 diff --git a/pytorch_model-00081-of-00082.bin b/pytorch_model-00081-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..e26932c2da17992ab465f0c5acf341e5b8431bc5 --- /dev/null +++ b/pytorch_model-00081-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45576a40edbfc363b894ddf5d279fe0f9108fe038eefec0edc4b4ac9113c1e8a +size 786464332 diff --git a/pytorch_model-00082-of-00082.bin b/pytorch_model-00082-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..51c9578c074b52c31a70f29c3568073a3ff4c139 --- /dev/null +++ b/pytorch_model-00082-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce01d2dc7af50e478871f03ded33345260231b695fb9f14b6ce8afafeea24873 +size 327680938 diff --git a/pytorch_model.bin.index.json b/pytorch_model.bin.index.json new file mode 100644 index 0000000000000000000000000000000000000000..7b598b9c532fda2bfe7c08e8df7232ac23a47e2f --- /dev/null +++ b/pytorch_model.bin.index.json @@ -0,0 +1,410 @@ +{ + "metadata": { + "total_size": 26031738880 + }, + "weight_map": { + "base_model.model.lm_head.weight": "pytorch_model-00082-of-00082.bin", + "model.embed_tokens.weight": "pytorch_model-00001-of-00082.bin", + "model.layers.0.input_layernorm.weight": "pytorch_model-00003-of-00082.bin", + "model.layers.0.mlp.down_proj.weight": "pytorch_model-00003-of-00082.bin", + "model.layers.0.mlp.gate_proj.weight": "pytorch_model-00002-of-00082.bin", + "model.layers.0.mlp.up_proj.weight": "pytorch_model-00003-of-00082.bin", + "model.layers.0.post_attention_layernorm.weight": "pytorch_model-00003-of-00082.bin", + "model.layers.0.self_attn.k_proj.weight": "pytorch_model-00002-of-00082.bin", + "model.layers.0.self_attn.o_proj.weight": "pytorch_model-00002-of-00082.bin", + "model.layers.0.self_attn.q_proj.weight": "pytorch_model-00001-of-00082.bin", + "model.layers.0.self_attn.rotary_emb.inv_freq": "pytorch_model-00002-of-00082.bin", + "model.layers.0.self_attn.v_proj.weight": "pytorch_model-00002-of-00082.bin", + "model.layers.1.input_layernorm.weight": "pytorch_model-00005-of-00082.bin", + "model.layers.1.mlp.down_proj.weight": "pytorch_model-00004-of-00082.bin", + "model.layers.1.mlp.gate_proj.weight": "pytorch_model-00004-of-00082.bin", + "model.layers.1.mlp.up_proj.weight": "pytorch_model-00005-of-00082.bin", + "model.layers.1.post_attention_layernorm.weight": "pytorch_model-00005-of-00082.bin", + "model.layers.1.self_attn.k_proj.weight": "pytorch_model-00003-of-00082.bin", + "model.layers.1.self_attn.o_proj.weight": "pytorch_model-00004-of-00082.bin", + "model.layers.1.self_attn.q_proj.weight": "pytorch_model-00003-of-00082.bin", + "model.layers.1.self_attn.rotary_emb.inv_freq": "pytorch_model-00004-of-00082.bin", + "model.layers.1.self_attn.v_proj.weight": "pytorch_model-00004-of-00082.bin", + "model.layers.10.input_layernorm.weight": "pytorch_model-00023-of-00082.bin", + "model.layers.10.mlp.down_proj.weight": "pytorch_model-00022-of-00082.bin", + "model.layers.10.mlp.gate_proj.weight": "pytorch_model-00022-of-00082.bin", + "model.layers.10.mlp.up_proj.weight": "pytorch_model-00023-of-00082.bin", + "model.layers.10.post_attention_layernorm.weight": "pytorch_model-00023-of-00082.bin", + "model.layers.10.self_attn.k_proj.weight": "pytorch_model-00021-of-00082.bin", + "model.layers.10.self_attn.o_proj.weight": "pytorch_model-00021-of-00082.bin", + "model.layers.10.self_attn.q_proj.weight": "pytorch_model-00021-of-00082.bin", + "model.layers.10.self_attn.rotary_emb.inv_freq": "pytorch_model-00021-of-00082.bin", + "model.layers.10.self_attn.v_proj.weight": "pytorch_model-00021-of-00082.bin", + "model.layers.11.input_layernorm.weight": "pytorch_model-00025-of-00082.bin", + "model.layers.11.mlp.down_proj.weight": "pytorch_model-00024-of-00082.bin", + "model.layers.11.mlp.gate_proj.weight": "pytorch_model-00024-of-00082.bin", + "model.layers.11.mlp.up_proj.weight": "pytorch_model-00025-of-00082.bin", + "model.layers.11.post_attention_layernorm.weight": "pytorch_model-00025-of-00082.bin", + "model.layers.11.self_attn.k_proj.weight": "pytorch_model-00023-of-00082.bin", + "model.layers.11.self_attn.o_proj.weight": "pytorch_model-00023-of-00082.bin", + "model.layers.11.self_attn.q_proj.weight": "pytorch_model-00023-of-00082.bin", + "model.layers.11.self_attn.rotary_emb.inv_freq": "pytorch_model-00023-of-00082.bin", + "model.layers.11.self_attn.v_proj.weight": "pytorch_model-00023-of-00082.bin", + "model.layers.12.input_layernorm.weight": "pytorch_model-00027-of-00082.bin", + "model.layers.12.mlp.down_proj.weight": "pytorch_model-00026-of-00082.bin", + "model.layers.12.mlp.gate_proj.weight": "pytorch_model-00026-of-00082.bin", + "model.layers.12.mlp.up_proj.weight": "pytorch_model-00027-of-00082.bin", + "model.layers.12.post_attention_layernorm.weight": "pytorch_model-00027-of-00082.bin", + "model.layers.12.self_attn.k_proj.weight": "pytorch_model-00025-of-00082.bin", + "model.layers.12.self_attn.o_proj.weight": "pytorch_model-00025-of-00082.bin", + "model.layers.12.self_attn.q_proj.weight": "pytorch_model-00025-of-00082.bin", + "model.layers.12.self_attn.rotary_emb.inv_freq": "pytorch_model-00025-of-00082.bin", + "model.layers.12.self_attn.v_proj.weight": "pytorch_model-00025-of-00082.bin", + "model.layers.13.input_layernorm.weight": "pytorch_model-00029-of-00082.bin", + "model.layers.13.mlp.down_proj.weight": "pytorch_model-00028-of-00082.bin", + "model.layers.13.mlp.gate_proj.weight": "pytorch_model-00028-of-00082.bin", + "model.layers.13.mlp.up_proj.weight": "pytorch_model-00029-of-00082.bin", + "model.layers.13.post_attention_layernorm.weight": "pytorch_model-00029-of-00082.bin", + "model.layers.13.self_attn.k_proj.weight": "pytorch_model-00027-of-00082.bin", + "model.layers.13.self_attn.o_proj.weight": "pytorch_model-00027-of-00082.bin", + "model.layers.13.self_attn.q_proj.weight": "pytorch_model-00027-of-00082.bin", + "model.layers.13.self_attn.rotary_emb.inv_freq": "pytorch_model-00027-of-00082.bin", + "model.layers.13.self_attn.v_proj.weight": "pytorch_model-00027-of-00082.bin", + "model.layers.14.input_layernorm.weight": "pytorch_model-00031-of-00082.bin", + "model.layers.14.mlp.down_proj.weight": "pytorch_model-00030-of-00082.bin", + "model.layers.14.mlp.gate_proj.weight": "pytorch_model-00030-of-00082.bin", + "model.layers.14.mlp.up_proj.weight": "pytorch_model-00031-of-00082.bin", + "model.layers.14.post_attention_layernorm.weight": "pytorch_model-00031-of-00082.bin", + "model.layers.14.self_attn.k_proj.weight": "pytorch_model-00029-of-00082.bin", + "model.layers.14.self_attn.o_proj.weight": "pytorch_model-00029-of-00082.bin", + "model.layers.14.self_attn.q_proj.weight": "pytorch_model-00029-of-00082.bin", + "model.layers.14.self_attn.rotary_emb.inv_freq": "pytorch_model-00029-of-00082.bin", + "model.layers.14.self_attn.v_proj.weight": "pytorch_model-00029-of-00082.bin", + "model.layers.15.input_layernorm.weight": "pytorch_model-00033-of-00082.bin", + "model.layers.15.mlp.down_proj.weight": "pytorch_model-00032-of-00082.bin", + "model.layers.15.mlp.gate_proj.weight": "pytorch_model-00032-of-00082.bin", + "model.layers.15.mlp.up_proj.weight": "pytorch_model-00033-of-00082.bin", + "model.layers.15.post_attention_layernorm.weight": "pytorch_model-00033-of-00082.bin", + "model.layers.15.self_attn.k_proj.weight": "pytorch_model-00031-of-00082.bin", + "model.layers.15.self_attn.o_proj.weight": "pytorch_model-00031-of-00082.bin", + "model.layers.15.self_attn.q_proj.weight": "pytorch_model-00031-of-00082.bin", + "model.layers.15.self_attn.rotary_emb.inv_freq": "pytorch_model-00031-of-00082.bin", + "model.layers.15.self_attn.v_proj.weight": "pytorch_model-00031-of-00082.bin", + "model.layers.16.input_layernorm.weight": "pytorch_model-00035-of-00082.bin", + "model.layers.16.mlp.down_proj.weight": "pytorch_model-00034-of-00082.bin", + "model.layers.16.mlp.gate_proj.weight": "pytorch_model-00034-of-00082.bin", + "model.layers.16.mlp.up_proj.weight": "pytorch_model-00035-of-00082.bin", + "model.layers.16.post_attention_layernorm.weight": "pytorch_model-00035-of-00082.bin", + "model.layers.16.self_attn.k_proj.weight": "pytorch_model-00033-of-00082.bin", + "model.layers.16.self_attn.o_proj.weight": "pytorch_model-00033-of-00082.bin", + "model.layers.16.self_attn.q_proj.weight": "pytorch_model-00033-of-00082.bin", + "model.layers.16.self_attn.rotary_emb.inv_freq": "pytorch_model-00033-of-00082.bin", + "model.layers.16.self_attn.v_proj.weight": "pytorch_model-00033-of-00082.bin", + "model.layers.17.input_layernorm.weight": "pytorch_model-00037-of-00082.bin", + "model.layers.17.mlp.down_proj.weight": "pytorch_model-00036-of-00082.bin", + "model.layers.17.mlp.gate_proj.weight": "pytorch_model-00036-of-00082.bin", + "model.layers.17.mlp.up_proj.weight": "pytorch_model-00037-of-00082.bin", + "model.layers.17.post_attention_layernorm.weight": "pytorch_model-00037-of-00082.bin", + "model.layers.17.self_attn.k_proj.weight": "pytorch_model-00035-of-00082.bin", + "model.layers.17.self_attn.o_proj.weight": "pytorch_model-00035-of-00082.bin", + "model.layers.17.self_attn.q_proj.weight": "pytorch_model-00035-of-00082.bin", + "model.layers.17.self_attn.rotary_emb.inv_freq": "pytorch_model-00035-of-00082.bin", + "model.layers.17.self_attn.v_proj.weight": "pytorch_model-00035-of-00082.bin", + "model.layers.18.input_layernorm.weight": "pytorch_model-00039-of-00082.bin", + "model.layers.18.mlp.down_proj.weight": "pytorch_model-00038-of-00082.bin", + "model.layers.18.mlp.gate_proj.weight": "pytorch_model-00038-of-00082.bin", + "model.layers.18.mlp.up_proj.weight": "pytorch_model-00039-of-00082.bin", + "model.layers.18.post_attention_layernorm.weight": "pytorch_model-00039-of-00082.bin", + "model.layers.18.self_attn.k_proj.weight": "pytorch_model-00037-of-00082.bin", + "model.layers.18.self_attn.o_proj.weight": "pytorch_model-00037-of-00082.bin", + "model.layers.18.self_attn.q_proj.weight": "pytorch_model-00037-of-00082.bin", + "model.layers.18.self_attn.rotary_emb.inv_freq": "pytorch_model-00037-of-00082.bin", + "model.layers.18.self_attn.v_proj.weight": "pytorch_model-00037-of-00082.bin", + "model.layers.19.input_layernorm.weight": "pytorch_model-00041-of-00082.bin", + "model.layers.19.mlp.down_proj.weight": "pytorch_model-00040-of-00082.bin", + "model.layers.19.mlp.gate_proj.weight": "pytorch_model-00040-of-00082.bin", + "model.layers.19.mlp.up_proj.weight": "pytorch_model-00041-of-00082.bin", + "model.layers.19.post_attention_layernorm.weight": "pytorch_model-00041-of-00082.bin", + "model.layers.19.self_attn.k_proj.weight": "pytorch_model-00039-of-00082.bin", + "model.layers.19.self_attn.o_proj.weight": "pytorch_model-00039-of-00082.bin", + "model.layers.19.self_attn.q_proj.weight": "pytorch_model-00039-of-00082.bin", + "model.layers.19.self_attn.rotary_emb.inv_freq": "pytorch_model-00039-of-00082.bin", + "model.layers.19.self_attn.v_proj.weight": "pytorch_model-00039-of-00082.bin", + "model.layers.2.input_layernorm.weight": "pytorch_model-00007-of-00082.bin", + "model.layers.2.mlp.down_proj.weight": "pytorch_model-00006-of-00082.bin", + "model.layers.2.mlp.gate_proj.weight": "pytorch_model-00006-of-00082.bin", + "model.layers.2.mlp.up_proj.weight": "pytorch_model-00007-of-00082.bin", + "model.layers.2.post_attention_layernorm.weight": "pytorch_model-00007-of-00082.bin", + "model.layers.2.self_attn.k_proj.weight": "pytorch_model-00005-of-00082.bin", + "model.layers.2.self_attn.o_proj.weight": "pytorch_model-00005-of-00082.bin", + "model.layers.2.self_attn.q_proj.weight": "pytorch_model-00005-of-00082.bin", + "model.layers.2.self_attn.rotary_emb.inv_freq": "pytorch_model-00005-of-00082.bin", + "model.layers.2.self_attn.v_proj.weight": "pytorch_model-00005-of-00082.bin", + "model.layers.20.input_layernorm.weight": "pytorch_model-00043-of-00082.bin", + "model.layers.20.mlp.down_proj.weight": "pytorch_model-00042-of-00082.bin", + "model.layers.20.mlp.gate_proj.weight": "pytorch_model-00042-of-00082.bin", + "model.layers.20.mlp.up_proj.weight": "pytorch_model-00043-of-00082.bin", + "model.layers.20.post_attention_layernorm.weight": "pytorch_model-00043-of-00082.bin", + "model.layers.20.self_attn.k_proj.weight": "pytorch_model-00041-of-00082.bin", + "model.layers.20.self_attn.o_proj.weight": "pytorch_model-00041-of-00082.bin", + "model.layers.20.self_attn.q_proj.weight": "pytorch_model-00041-of-00082.bin", + "model.layers.20.self_attn.rotary_emb.inv_freq": "pytorch_model-00041-of-00082.bin", + "model.layers.20.self_attn.v_proj.weight": "pytorch_model-00041-of-00082.bin", + "model.layers.21.input_layernorm.weight": "pytorch_model-00045-of-00082.bin", + "model.layers.21.mlp.down_proj.weight": "pytorch_model-00044-of-00082.bin", + "model.layers.21.mlp.gate_proj.weight": "pytorch_model-00044-of-00082.bin", + "model.layers.21.mlp.up_proj.weight": "pytorch_model-00045-of-00082.bin", + "model.layers.21.post_attention_layernorm.weight": "pytorch_model-00045-of-00082.bin", + "model.layers.21.self_attn.k_proj.weight": "pytorch_model-00043-of-00082.bin", + "model.layers.21.self_attn.o_proj.weight": "pytorch_model-00043-of-00082.bin", + "model.layers.21.self_attn.q_proj.weight": "pytorch_model-00043-of-00082.bin", + "model.layers.21.self_attn.rotary_emb.inv_freq": "pytorch_model-00043-of-00082.bin", + "model.layers.21.self_attn.v_proj.weight": "pytorch_model-00043-of-00082.bin", + "model.layers.22.input_layernorm.weight": "pytorch_model-00047-of-00082.bin", + "model.layers.22.mlp.down_proj.weight": "pytorch_model-00046-of-00082.bin", + "model.layers.22.mlp.gate_proj.weight": "pytorch_model-00046-of-00082.bin", + "model.layers.22.mlp.up_proj.weight": "pytorch_model-00047-of-00082.bin", + "model.layers.22.post_attention_layernorm.weight": "pytorch_model-00047-of-00082.bin", + "model.layers.22.self_attn.k_proj.weight": "pytorch_model-00045-of-00082.bin", + "model.layers.22.self_attn.o_proj.weight": "pytorch_model-00045-of-00082.bin", + "model.layers.22.self_attn.q_proj.weight": "pytorch_model-00045-of-00082.bin", + "model.layers.22.self_attn.rotary_emb.inv_freq": "pytorch_model-00045-of-00082.bin", + "model.layers.22.self_attn.v_proj.weight": "pytorch_model-00045-of-00082.bin", + "model.layers.23.input_layernorm.weight": "pytorch_model-00049-of-00082.bin", + "model.layers.23.mlp.down_proj.weight": "pytorch_model-00048-of-00082.bin", + "model.layers.23.mlp.gate_proj.weight": "pytorch_model-00048-of-00082.bin", + "model.layers.23.mlp.up_proj.weight": "pytorch_model-00049-of-00082.bin", + "model.layers.23.post_attention_layernorm.weight": "pytorch_model-00049-of-00082.bin", + "model.layers.23.self_attn.k_proj.weight": "pytorch_model-00047-of-00082.bin", + "model.layers.23.self_attn.o_proj.weight": "pytorch_model-00047-of-00082.bin", + "model.layers.23.self_attn.q_proj.weight": "pytorch_model-00047-of-00082.bin", + "model.layers.23.self_attn.rotary_emb.inv_freq": "pytorch_model-00047-of-00082.bin", + "model.layers.23.self_attn.v_proj.weight": "pytorch_model-00047-of-00082.bin", + "model.layers.24.input_layernorm.weight": "pytorch_model-00051-of-00082.bin", + "model.layers.24.mlp.down_proj.weight": "pytorch_model-00050-of-00082.bin", + "model.layers.24.mlp.gate_proj.weight": "pytorch_model-00050-of-00082.bin", + "model.layers.24.mlp.up_proj.weight": "pytorch_model-00051-of-00082.bin", + "model.layers.24.post_attention_layernorm.weight": "pytorch_model-00051-of-00082.bin", + "model.layers.24.self_attn.k_proj.weight": "pytorch_model-00049-of-00082.bin", + "model.layers.24.self_attn.o_proj.weight": "pytorch_model-00049-of-00082.bin", + "model.layers.24.self_attn.q_proj.weight": "pytorch_model-00049-of-00082.bin", + "model.layers.24.self_attn.rotary_emb.inv_freq": "pytorch_model-00049-of-00082.bin", + "model.layers.24.self_attn.v_proj.weight": "pytorch_model-00049-of-00082.bin", + "model.layers.25.input_layernorm.weight": "pytorch_model-00053-of-00082.bin", + "model.layers.25.mlp.down_proj.weight": "pytorch_model-00052-of-00082.bin", + "model.layers.25.mlp.gate_proj.weight": "pytorch_model-00052-of-00082.bin", + "model.layers.25.mlp.up_proj.weight": "pytorch_model-00053-of-00082.bin", + "model.layers.25.post_attention_layernorm.weight": "pytorch_model-00053-of-00082.bin", + "model.layers.25.self_attn.k_proj.weight": "pytorch_model-00051-of-00082.bin", + "model.layers.25.self_attn.o_proj.weight": "pytorch_model-00051-of-00082.bin", + "model.layers.25.self_attn.q_proj.weight": "pytorch_model-00051-of-00082.bin", + "model.layers.25.self_attn.rotary_emb.inv_freq": "pytorch_model-00051-of-00082.bin", + "model.layers.25.self_attn.v_proj.weight": "pytorch_model-00051-of-00082.bin", + "model.layers.26.input_layernorm.weight": "pytorch_model-00055-of-00082.bin", + "model.layers.26.mlp.down_proj.weight": "pytorch_model-00054-of-00082.bin", + "model.layers.26.mlp.gate_proj.weight": "pytorch_model-00054-of-00082.bin", + "model.layers.26.mlp.up_proj.weight": "pytorch_model-00055-of-00082.bin", + "model.layers.26.post_attention_layernorm.weight": "pytorch_model-00055-of-00082.bin", + "model.layers.26.self_attn.k_proj.weight": "pytorch_model-00053-of-00082.bin", + "model.layers.26.self_attn.o_proj.weight": "pytorch_model-00053-of-00082.bin", + "model.layers.26.self_attn.q_proj.weight": "pytorch_model-00053-of-00082.bin", + "model.layers.26.self_attn.rotary_emb.inv_freq": "pytorch_model-00053-of-00082.bin", + "model.layers.26.self_attn.v_proj.weight": "pytorch_model-00053-of-00082.bin", + "model.layers.27.input_layernorm.weight": "pytorch_model-00057-of-00082.bin", + "model.layers.27.mlp.down_proj.weight": "pytorch_model-00056-of-00082.bin", + "model.layers.27.mlp.gate_proj.weight": "pytorch_model-00056-of-00082.bin", + "model.layers.27.mlp.up_proj.weight": "pytorch_model-00057-of-00082.bin", + "model.layers.27.post_attention_layernorm.weight": "pytorch_model-00057-of-00082.bin", + "model.layers.27.self_attn.k_proj.weight": "pytorch_model-00055-of-00082.bin", + "model.layers.27.self_attn.o_proj.weight": "pytorch_model-00055-of-00082.bin", + "model.layers.27.self_attn.q_proj.weight": "pytorch_model-00055-of-00082.bin", + "model.layers.27.self_attn.rotary_emb.inv_freq": "pytorch_model-00055-of-00082.bin", + "model.layers.27.self_attn.v_proj.weight": "pytorch_model-00055-of-00082.bin", + "model.layers.28.input_layernorm.weight": "pytorch_model-00059-of-00082.bin", + "model.layers.28.mlp.down_proj.weight": "pytorch_model-00058-of-00082.bin", + "model.layers.28.mlp.gate_proj.weight": "pytorch_model-00058-of-00082.bin", + "model.layers.28.mlp.up_proj.weight": "pytorch_model-00059-of-00082.bin", + "model.layers.28.post_attention_layernorm.weight": "pytorch_model-00059-of-00082.bin", + "model.layers.28.self_attn.k_proj.weight": "pytorch_model-00057-of-00082.bin", + "model.layers.28.self_attn.o_proj.weight": "pytorch_model-00057-of-00082.bin", + "model.layers.28.self_attn.q_proj.weight": "pytorch_model-00057-of-00082.bin", + "model.layers.28.self_attn.rotary_emb.inv_freq": "pytorch_model-00057-of-00082.bin", + "model.layers.28.self_attn.v_proj.weight": "pytorch_model-00057-of-00082.bin", + "model.layers.29.input_layernorm.weight": "pytorch_model-00061-of-00082.bin", + "model.layers.29.mlp.down_proj.weight": "pytorch_model-00060-of-00082.bin", + "model.layers.29.mlp.gate_proj.weight": "pytorch_model-00060-of-00082.bin", + "model.layers.29.mlp.up_proj.weight": "pytorch_model-00061-of-00082.bin", + "model.layers.29.post_attention_layernorm.weight": "pytorch_model-00061-of-00082.bin", + "model.layers.29.self_attn.k_proj.weight": "pytorch_model-00059-of-00082.bin", + "model.layers.29.self_attn.o_proj.weight": "pytorch_model-00059-of-00082.bin", + "model.layers.29.self_attn.q_proj.weight": "pytorch_model-00059-of-00082.bin", + "model.layers.29.self_attn.rotary_emb.inv_freq": "pytorch_model-00059-of-00082.bin", + "model.layers.29.self_attn.v_proj.weight": "pytorch_model-00059-of-00082.bin", + "model.layers.3.input_layernorm.weight": "pytorch_model-00009-of-00082.bin", + "model.layers.3.mlp.down_proj.weight": "pytorch_model-00008-of-00082.bin", + "model.layers.3.mlp.gate_proj.weight": "pytorch_model-00008-of-00082.bin", + "model.layers.3.mlp.up_proj.weight": "pytorch_model-00009-of-00082.bin", + "model.layers.3.post_attention_layernorm.weight": "pytorch_model-00009-of-00082.bin", + "model.layers.3.self_attn.k_proj.weight": "pytorch_model-00007-of-00082.bin", + "model.layers.3.self_attn.o_proj.weight": "pytorch_model-00007-of-00082.bin", + "model.layers.3.self_attn.q_proj.weight": "pytorch_model-00007-of-00082.bin", + "model.layers.3.self_attn.rotary_emb.inv_freq": "pytorch_model-00007-of-00082.bin", + "model.layers.3.self_attn.v_proj.weight": "pytorch_model-00007-of-00082.bin", + "model.layers.30.input_layernorm.weight": "pytorch_model-00063-of-00082.bin", + "model.layers.30.mlp.down_proj.weight": "pytorch_model-00062-of-00082.bin", + "model.layers.30.mlp.gate_proj.weight": "pytorch_model-00062-of-00082.bin", + "model.layers.30.mlp.up_proj.weight": "pytorch_model-00063-of-00082.bin", + "model.layers.30.post_attention_layernorm.weight": "pytorch_model-00063-of-00082.bin", + "model.layers.30.self_attn.k_proj.weight": "pytorch_model-00061-of-00082.bin", + "model.layers.30.self_attn.o_proj.weight": "pytorch_model-00061-of-00082.bin", + "model.layers.30.self_attn.q_proj.weight": "pytorch_model-00061-of-00082.bin", + "model.layers.30.self_attn.rotary_emb.inv_freq": "pytorch_model-00061-of-00082.bin", + "model.layers.30.self_attn.v_proj.weight": "pytorch_model-00061-of-00082.bin", + "model.layers.31.input_layernorm.weight": "pytorch_model-00065-of-00082.bin", + "model.layers.31.mlp.down_proj.weight": "pytorch_model-00064-of-00082.bin", + "model.layers.31.mlp.gate_proj.weight": "pytorch_model-00064-of-00082.bin", + "model.layers.31.mlp.up_proj.weight": "pytorch_model-00065-of-00082.bin", + "model.layers.31.post_attention_layernorm.weight": "pytorch_model-00065-of-00082.bin", + "model.layers.31.self_attn.k_proj.weight": "pytorch_model-00063-of-00082.bin", + "model.layers.31.self_attn.o_proj.weight": "pytorch_model-00063-of-00082.bin", + "model.layers.31.self_attn.q_proj.weight": "pytorch_model-00063-of-00082.bin", + "model.layers.31.self_attn.rotary_emb.inv_freq": "pytorch_model-00063-of-00082.bin", + "model.layers.31.self_attn.v_proj.weight": "pytorch_model-00063-of-00082.bin", + "model.layers.32.input_layernorm.weight": "pytorch_model-00067-of-00082.bin", + "model.layers.32.mlp.down_proj.weight": "pytorch_model-00066-of-00082.bin", + "model.layers.32.mlp.gate_proj.weight": "pytorch_model-00066-of-00082.bin", + "model.layers.32.mlp.up_proj.weight": "pytorch_model-00067-of-00082.bin", + "model.layers.32.post_attention_layernorm.weight": "pytorch_model-00067-of-00082.bin", + "model.layers.32.self_attn.k_proj.weight": "pytorch_model-00065-of-00082.bin", + "model.layers.32.self_attn.o_proj.weight": "pytorch_model-00065-of-00082.bin", + "model.layers.32.self_attn.q_proj.weight": "pytorch_model-00065-of-00082.bin", + "model.layers.32.self_attn.rotary_emb.inv_freq": "pytorch_model-00065-of-00082.bin", + "model.layers.32.self_attn.v_proj.weight": "pytorch_model-00065-of-00082.bin", + "model.layers.33.input_layernorm.weight": "pytorch_model-00069-of-00082.bin", + "model.layers.33.mlp.down_proj.weight": "pytorch_model-00068-of-00082.bin", + "model.layers.33.mlp.gate_proj.weight": "pytorch_model-00068-of-00082.bin", + "model.layers.33.mlp.up_proj.weight": "pytorch_model-00069-of-00082.bin", + "model.layers.33.post_attention_layernorm.weight": "pytorch_model-00069-of-00082.bin", + "model.layers.33.self_attn.k_proj.weight": "pytorch_model-00067-of-00082.bin", + "model.layers.33.self_attn.o_proj.weight": "pytorch_model-00067-of-00082.bin", + "model.layers.33.self_attn.q_proj.weight": "pytorch_model-00067-of-00082.bin", + "model.layers.33.self_attn.rotary_emb.inv_freq": "pytorch_model-00067-of-00082.bin", + "model.layers.33.self_attn.v_proj.weight": "pytorch_model-00067-of-00082.bin", + "model.layers.34.input_layernorm.weight": "pytorch_model-00071-of-00082.bin", + "model.layers.34.mlp.down_proj.weight": "pytorch_model-00070-of-00082.bin", + "model.layers.34.mlp.gate_proj.weight": "pytorch_model-00070-of-00082.bin", + "model.layers.34.mlp.up_proj.weight": "pytorch_model-00071-of-00082.bin", + "model.layers.34.post_attention_layernorm.weight": "pytorch_model-00071-of-00082.bin", + "model.layers.34.self_attn.k_proj.weight": "pytorch_model-00069-of-00082.bin", + "model.layers.34.self_attn.o_proj.weight": "pytorch_model-00069-of-00082.bin", + "model.layers.34.self_attn.q_proj.weight": "pytorch_model-00069-of-00082.bin", + "model.layers.34.self_attn.rotary_emb.inv_freq": "pytorch_model-00069-of-00082.bin", + "model.layers.34.self_attn.v_proj.weight": "pytorch_model-00069-of-00082.bin", + "model.layers.35.input_layernorm.weight": "pytorch_model-00073-of-00082.bin", + "model.layers.35.mlp.down_proj.weight": "pytorch_model-00072-of-00082.bin", + "model.layers.35.mlp.gate_proj.weight": "pytorch_model-00072-of-00082.bin", + "model.layers.35.mlp.up_proj.weight": "pytorch_model-00073-of-00082.bin", + "model.layers.35.post_attention_layernorm.weight": "pytorch_model-00073-of-00082.bin", + "model.layers.35.self_attn.k_proj.weight": "pytorch_model-00071-of-00082.bin", + "model.layers.35.self_attn.o_proj.weight": "pytorch_model-00071-of-00082.bin", + "model.layers.35.self_attn.q_proj.weight": "pytorch_model-00071-of-00082.bin", + "model.layers.35.self_attn.rotary_emb.inv_freq": "pytorch_model-00071-of-00082.bin", + "model.layers.35.self_attn.v_proj.weight": "pytorch_model-00071-of-00082.bin", + "model.layers.36.input_layernorm.weight": "pytorch_model-00075-of-00082.bin", + "model.layers.36.mlp.down_proj.weight": "pytorch_model-00074-of-00082.bin", + "model.layers.36.mlp.gate_proj.weight": "pytorch_model-00074-of-00082.bin", + "model.layers.36.mlp.up_proj.weight": "pytorch_model-00075-of-00082.bin", + "model.layers.36.post_attention_layernorm.weight": "pytorch_model-00075-of-00082.bin", + "model.layers.36.self_attn.k_proj.weight": "pytorch_model-00073-of-00082.bin", + "model.layers.36.self_attn.o_proj.weight": "pytorch_model-00073-of-00082.bin", + "model.layers.36.self_attn.q_proj.weight": "pytorch_model-00073-of-00082.bin", + "model.layers.36.self_attn.rotary_emb.inv_freq": "pytorch_model-00073-of-00082.bin", + "model.layers.36.self_attn.v_proj.weight": "pytorch_model-00073-of-00082.bin", + "model.layers.37.input_layernorm.weight": "pytorch_model-00077-of-00082.bin", + "model.layers.37.mlp.down_proj.weight": "pytorch_model-00076-of-00082.bin", + "model.layers.37.mlp.gate_proj.weight": "pytorch_model-00076-of-00082.bin", + "model.layers.37.mlp.up_proj.weight": "pytorch_model-00077-of-00082.bin", + "model.layers.37.post_attention_layernorm.weight": "pytorch_model-00077-of-00082.bin", + "model.layers.37.self_attn.k_proj.weight": "pytorch_model-00075-of-00082.bin", + "model.layers.37.self_attn.o_proj.weight": "pytorch_model-00075-of-00082.bin", + "model.layers.37.self_attn.q_proj.weight": "pytorch_model-00075-of-00082.bin", + "model.layers.37.self_attn.rotary_emb.inv_freq": "pytorch_model-00075-of-00082.bin", + "model.layers.37.self_attn.v_proj.weight": "pytorch_model-00075-of-00082.bin", + "model.layers.38.input_layernorm.weight": "pytorch_model-00079-of-00082.bin", + "model.layers.38.mlp.down_proj.weight": "pytorch_model-00078-of-00082.bin", + "model.layers.38.mlp.gate_proj.weight": "pytorch_model-00078-of-00082.bin", + "model.layers.38.mlp.up_proj.weight": "pytorch_model-00079-of-00082.bin", + "model.layers.38.post_attention_layernorm.weight": "pytorch_model-00079-of-00082.bin", + "model.layers.38.self_attn.k_proj.weight": "pytorch_model-00077-of-00082.bin", + "model.layers.38.self_attn.o_proj.weight": "pytorch_model-00077-of-00082.bin", + "model.layers.38.self_attn.q_proj.weight": "pytorch_model-00077-of-00082.bin", + "model.layers.38.self_attn.rotary_emb.inv_freq": "pytorch_model-00077-of-00082.bin", + "model.layers.38.self_attn.v_proj.weight": "pytorch_model-00077-of-00082.bin", + "model.layers.39.input_layernorm.weight": "pytorch_model-00081-of-00082.bin", + "model.layers.39.mlp.down_proj.weight": "pytorch_model-00080-of-00082.bin", + "model.layers.39.mlp.gate_proj.weight": "pytorch_model-00080-of-00082.bin", + "model.layers.39.mlp.up_proj.weight": "pytorch_model-00081-of-00082.bin", + "model.layers.39.post_attention_layernorm.weight": "pytorch_model-00081-of-00082.bin", + "model.layers.39.self_attn.k_proj.weight": "pytorch_model-00079-of-00082.bin", + "model.layers.39.self_attn.o_proj.weight": "pytorch_model-00079-of-00082.bin", + "model.layers.39.self_attn.q_proj.weight": "pytorch_model-00079-of-00082.bin", + "model.layers.39.self_attn.rotary_emb.inv_freq": "pytorch_model-00079-of-00082.bin", + "model.layers.39.self_attn.v_proj.weight": "pytorch_model-00079-of-00082.bin", + "model.layers.4.input_layernorm.weight": "pytorch_model-00011-of-00082.bin", + "model.layers.4.mlp.down_proj.weight": "pytorch_model-00010-of-00082.bin", + "model.layers.4.mlp.gate_proj.weight": "pytorch_model-00010-of-00082.bin", + "model.layers.4.mlp.up_proj.weight": "pytorch_model-00011-of-00082.bin", + "model.layers.4.post_attention_layernorm.weight": "pytorch_model-00011-of-00082.bin", + "model.layers.4.self_attn.k_proj.weight": "pytorch_model-00009-of-00082.bin", + "model.layers.4.self_attn.o_proj.weight": "pytorch_model-00009-of-00082.bin", + "model.layers.4.self_attn.q_proj.weight": "pytorch_model-00009-of-00082.bin", + "model.layers.4.self_attn.rotary_emb.inv_freq": "pytorch_model-00009-of-00082.bin", + "model.layers.4.self_attn.v_proj.weight": "pytorch_model-00009-of-00082.bin", + "model.layers.5.input_layernorm.weight": "pytorch_model-00013-of-00082.bin", + "model.layers.5.mlp.down_proj.weight": "pytorch_model-00012-of-00082.bin", + "model.layers.5.mlp.gate_proj.weight": "pytorch_model-00012-of-00082.bin", + "model.layers.5.mlp.up_proj.weight": "pytorch_model-00013-of-00082.bin", + "model.layers.5.post_attention_layernorm.weight": "pytorch_model-00013-of-00082.bin", + "model.layers.5.self_attn.k_proj.weight": "pytorch_model-00011-of-00082.bin", + "model.layers.5.self_attn.o_proj.weight": "pytorch_model-00011-of-00082.bin", + "model.layers.5.self_attn.q_proj.weight": "pytorch_model-00011-of-00082.bin", + "model.layers.5.self_attn.rotary_emb.inv_freq": "pytorch_model-00011-of-00082.bin", + "model.layers.5.self_attn.v_proj.weight": "pytorch_model-00011-of-00082.bin", + "model.layers.6.input_layernorm.weight": "pytorch_model-00015-of-00082.bin", + "model.layers.6.mlp.down_proj.weight": "pytorch_model-00014-of-00082.bin", + "model.layers.6.mlp.gate_proj.weight": "pytorch_model-00014-of-00082.bin", + "model.layers.6.mlp.up_proj.weight": "pytorch_model-00015-of-00082.bin", + "model.layers.6.post_attention_layernorm.weight": "pytorch_model-00015-of-00082.bin", + "model.layers.6.self_attn.k_proj.weight": "pytorch_model-00013-of-00082.bin", + "model.layers.6.self_attn.o_proj.weight": "pytorch_model-00013-of-00082.bin", + "model.layers.6.self_attn.q_proj.weight": "pytorch_model-00013-of-00082.bin", + "model.layers.6.self_attn.rotary_emb.inv_freq": "pytorch_model-00013-of-00082.bin", + "model.layers.6.self_attn.v_proj.weight": "pytorch_model-00013-of-00082.bin", + "model.layers.7.input_layernorm.weight": "pytorch_model-00017-of-00082.bin", + "model.layers.7.mlp.down_proj.weight": "pytorch_model-00016-of-00082.bin", + "model.layers.7.mlp.gate_proj.weight": "pytorch_model-00016-of-00082.bin", + "model.layers.7.mlp.up_proj.weight": "pytorch_model-00017-of-00082.bin", + "model.layers.7.post_attention_layernorm.weight": "pytorch_model-00017-of-00082.bin", + "model.layers.7.self_attn.k_proj.weight": "pytorch_model-00015-of-00082.bin", + "model.layers.7.self_attn.o_proj.weight": "pytorch_model-00015-of-00082.bin", + "model.layers.7.self_attn.q_proj.weight": "pytorch_model-00015-of-00082.bin", + "model.layers.7.self_attn.rotary_emb.inv_freq": "pytorch_model-00015-of-00082.bin", + "model.layers.7.self_attn.v_proj.weight": "pytorch_model-00015-of-00082.bin", + "model.layers.8.input_layernorm.weight": "pytorch_model-00019-of-00082.bin", + "model.layers.8.mlp.down_proj.weight": "pytorch_model-00018-of-00082.bin", + "model.layers.8.mlp.gate_proj.weight": "pytorch_model-00018-of-00082.bin", + "model.layers.8.mlp.up_proj.weight": "pytorch_model-00019-of-00082.bin", + "model.layers.8.post_attention_layernorm.weight": "pytorch_model-00019-of-00082.bin", + "model.layers.8.self_attn.k_proj.weight": "pytorch_model-00017-of-00082.bin", + "model.layers.8.self_attn.o_proj.weight": "pytorch_model-00017-of-00082.bin", + "model.layers.8.self_attn.q_proj.weight": "pytorch_model-00017-of-00082.bin", + "model.layers.8.self_attn.rotary_emb.inv_freq": "pytorch_model-00017-of-00082.bin", + "model.layers.8.self_attn.v_proj.weight": "pytorch_model-00017-of-00082.bin", + "model.layers.9.input_layernorm.weight": "pytorch_model-00021-of-00082.bin", + "model.layers.9.mlp.down_proj.weight": "pytorch_model-00020-of-00082.bin", + "model.layers.9.mlp.gate_proj.weight": "pytorch_model-00020-of-00082.bin", + "model.layers.9.mlp.up_proj.weight": "pytorch_model-00021-of-00082.bin", + "model.layers.9.post_attention_layernorm.weight": "pytorch_model-00021-of-00082.bin", + "model.layers.9.self_attn.k_proj.weight": "pytorch_model-00019-of-00082.bin", + "model.layers.9.self_attn.o_proj.weight": "pytorch_model-00019-of-00082.bin", + "model.layers.9.self_attn.q_proj.weight": "pytorch_model-00019-of-00082.bin", + "model.layers.9.self_attn.rotary_emb.inv_freq": "pytorch_model-00019-of-00082.bin", + "model.layers.9.self_attn.v_proj.weight": "pytorch_model-00019-of-00082.bin", + "model.norm.weight": "pytorch_model-00081-of-00082.bin" + } +}