diff --git a/config.json b/config.json new file mode 100644 index 0000000000000000000000000000000000000000..36913369aa5f70f18c97a565e45bef61cbe8f7c5 --- /dev/null +++ b/config.json @@ -0,0 +1,23 @@ +{ + "_name_or_path": "yahma/llama-13b-hf", + "architectures": [ + "LlamaForCausalLM" + ], + "bos_token_id": 1, + "eos_token_id": 2, + "hidden_act": "silu", + "hidden_size": 5120, + "initializer_range": 0.02, + "intermediate_size": 13824, + "max_position_embeddings": 2048, + "model_type": "llama", + "num_attention_heads": 40, + "num_hidden_layers": 40, + "pad_token_id": 0, + "rms_norm_eps": 1e-06, + "tie_word_embeddings": false, + "torch_dtype": "float16", + "transformers_version": "4.28.1", + "use_cache": true, + "vocab_size": 32000 +} diff --git a/generation_config.json b/generation_config.json new file mode 100644 index 0000000000000000000000000000000000000000..1372199d8db4c7b56921c19c5306013ce5b3c62d --- /dev/null +++ b/generation_config.json @@ -0,0 +1,7 @@ +{ + "_from_model_config": true, + "bos_token_id": 1, + "eos_token_id": 2, + "pad_token_id": 0, + "transformers_version": "4.28.1" +} diff --git a/pytorch_model-00001-of-00082.bin b/pytorch_model-00001-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..cc23bdabb9074b815bc85a52194a4c427225682c --- /dev/null +++ b/pytorch_model-00001-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9c7da175fcf53562169433889e6f2744229a8b68f8cc8d2f24e37fb998782fc +size 380110075 diff --git a/pytorch_model-00002-of-00082.bin b/pytorch_model-00002-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..f045cffae56eb735dee610e49b642395f29226dc --- /dev/null +++ b/pytorch_model-00002-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bb354a6c54d513510fd47e6aaba33732edc733a5785c7b2e6db6ada07ce73a0 +size 298846638 diff --git a/pytorch_model-00003-of-00082.bin b/pytorch_model-00003-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..3951c241afa071e848b86004c39d9f2bc2add391 --- /dev/null +++ b/pytorch_model-00003-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24536891ceb2a899323903c657e50b423240a17efdd077ca3d947943297c22c3 +size 387996095 diff --git a/pytorch_model-00004-of-00082.bin b/pytorch_model-00004-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..aecbddd05419ceac5fdd58b562cd90006404b4f5 --- /dev/null +++ b/pytorch_model-00004-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ededbaa7908086b6234b1312f43024f8057a60af10bafd62b36a3f5ce3c69187 +size 387975598 diff --git a/pytorch_model-00005-of-00082.bin b/pytorch_model-00005-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..1da92f1c92a4a1869bdab95b5f9c51849b78a903 --- /dev/null +++ b/pytorch_model-00005-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c9ef468667a6cc28ba95b7efb893f6ff4cdc6c3982b92948b0ee6da93c227d3 +size 351296801 diff --git a/pytorch_model-00006-of-00082.bin b/pytorch_model-00006-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..357a8e07dc9f069a793a4cb5c772dc927222dd27 --- /dev/null +++ b/pytorch_model-00006-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cc1c552640ca98eb953174f314be35003e7d0a83cd66876dfc2503213d47599 +size 283116795 diff --git a/pytorch_model-00007-of-00082.bin b/pytorch_model-00007-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..77e999cace9a2e133f8fdd68a9f32f4e73562b27 --- /dev/null +++ b/pytorch_model-00007-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea30982eadad08255b3020d7808b86b540f9d5483ce903f09225c718c648e9cd +size 351296801 diff --git a/pytorch_model-00008-of-00082.bin b/pytorch_model-00008-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..8677493c4cd36c57b2e669f2567150c869840cbc --- /dev/null +++ b/pytorch_model-00008-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d80edfca8890f5fa22322cd6a7a074cf8ac967766693d97adc3169ea734ad75 +size 283116795 diff --git a/pytorch_model-00009-of-00082.bin b/pytorch_model-00009-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..47b67dfa6b59617335bd869712b5524f5224e9e2 --- /dev/null +++ b/pytorch_model-00009-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5133d32a237bf50c6fe2519920c9fde4469574783e2be786436cf90ea14f1348 +size 351296801 diff --git a/pytorch_model-00010-of-00082.bin b/pytorch_model-00010-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..d03ddd77c776a7649998f759a802c0e1288c0282 --- /dev/null +++ b/pytorch_model-00010-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92e29f91a92127ef330e71f0f664b8d3ada8526427ed6ef8a85efd6a668b8f60 +size 283116795 diff --git a/pytorch_model-00011-of-00082.bin b/pytorch_model-00011-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..d831b604b3bba6ae482060379f55a5da46e5dca8 --- /dev/null +++ b/pytorch_model-00011-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:840a0b44cd4ad026f1567ca83dc301a6d75ecb463a8ca4a968cf55b53f67e4a7 +size 351296801 diff --git a/pytorch_model-00012-of-00082.bin b/pytorch_model-00012-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..7dc44cc388c43ef7552244a052ad564c31739a0a --- /dev/null +++ b/pytorch_model-00012-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26136f021a572bc5545c45366793f328b27ba7a817169e882ee43512ed920986 +size 283116795 diff --git a/pytorch_model-00013-of-00082.bin b/pytorch_model-00013-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..94fd7015d51ac9e0e587c3e59cf93fd184c1f4a2 --- /dev/null +++ b/pytorch_model-00013-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0848c5839098277023e9b553c3b8c68ced3b60608c5d8919080f3373ac6162fd +size 351296801 diff --git a/pytorch_model-00014-of-00082.bin b/pytorch_model-00014-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..f76074b851a2e0adb596955f2cebbf4624d6d176 --- /dev/null +++ b/pytorch_model-00014-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad550ac7984955710c3aef53b3cf44b675736373cced6bdde2c10bd90fd05e00 +size 283116795 diff --git a/pytorch_model-00015-of-00082.bin b/pytorch_model-00015-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..40392639cfb1d64f877eb77aadccfd7688ff0898 --- /dev/null +++ b/pytorch_model-00015-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af57bbab71bdeedf731053883da82ff247eb845a49d828eb2f38f1873a8ff201 +size 351296801 diff --git a/pytorch_model-00016-of-00082.bin b/pytorch_model-00016-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..10ee4d4ffbd2be738c61b5d2955e77e90b648284 --- /dev/null +++ b/pytorch_model-00016-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8291046bbb599b31c293ce23e3174a87834c97e765d37aff394a8227c120ffcb +size 283116795 diff --git a/pytorch_model-00017-of-00082.bin b/pytorch_model-00017-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..f38483b7888ac573f368add8e892b6431bfd624b --- /dev/null +++ b/pytorch_model-00017-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8746f649c74ba8c4261a19c9dc1df15e2fadd28e503e1220f902ff139ed245ec +size 351296801 diff --git a/pytorch_model-00018-of-00082.bin b/pytorch_model-00018-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..7e6e67161e363674e5933b9ebc814b107e6e76d1 --- /dev/null +++ b/pytorch_model-00018-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e25c2a779547ff1bfea36dd16d6ce68844d784c3594f502aa8279723fbb54bfc +size 283116795 diff --git a/pytorch_model-00019-of-00082.bin b/pytorch_model-00019-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..cb79899f5a4b5a729f228775e48235dfd4281638 --- /dev/null +++ b/pytorch_model-00019-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e79c54f5663ec82dc431f47ca5ae1af6eb82d7fa08d9dcc0e9cca95544331619 +size 351296801 diff --git a/pytorch_model-00020-of-00082.bin b/pytorch_model-00020-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..edfb3fbb39b468301570d6f86d87706d92294cd7 --- /dev/null +++ b/pytorch_model-00020-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcf8ba21239f070b3dddf08b428a032ec1a0f0b97adf91d614db67685b8a2f3c +size 283116795 diff --git a/pytorch_model-00021-of-00082.bin b/pytorch_model-00021-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..d75f57405f68cdeef7ffb81024c171481639d246 --- /dev/null +++ b/pytorch_model-00021-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2d793fcdb8b3afd872f9936d4a9b189e5a8d1b17ba87f1dcc43ac8fddcdaead +size 351296865 diff --git a/pytorch_model-00022-of-00082.bin b/pytorch_model-00022-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..08e30781089efed1fc42331db4943b7eec37c22d --- /dev/null +++ b/pytorch_model-00022-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c538c86a2cb6f36a03ee39afeb1fbd580c169b6d25b27108e3a6539b68cd8f1 +size 283116795 diff --git a/pytorch_model-00023-of-00082.bin b/pytorch_model-00023-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..1b75588eb36262e0511275f2d2af3ed1c22e50b6 --- /dev/null +++ b/pytorch_model-00023-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:992f8302d94089e0135acd7024a1cc141d97d1c6150eec1832310b6e9d7bc1d0 +size 351296865 diff --git a/pytorch_model-00024-of-00082.bin b/pytorch_model-00024-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..ad36a39e79b2883251924da5f297a8870441a325 --- /dev/null +++ b/pytorch_model-00024-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6591f1b2560ba2159919148ccd3d14edc04503f2d006ed1b15b57c57f626e9e9 +size 283116795 diff --git a/pytorch_model-00025-of-00082.bin b/pytorch_model-00025-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..037c70a4a7168f2f5fad06dda2a7e098844d1130 --- /dev/null +++ b/pytorch_model-00025-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c359b470c0d31a931c8cd4f267b216bab86ba09aeb84905fd93863a22f07e118 +size 351296865 diff --git a/pytorch_model-00026-of-00082.bin b/pytorch_model-00026-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..4b1d3ef696bb24a46397b4b177c482422026f37b --- /dev/null +++ b/pytorch_model-00026-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76eee6652908ce206baf7357d9f5d8ad301a8f8d79428aec99ef7dec3b32e646 +size 283116795 diff --git a/pytorch_model-00027-of-00082.bin b/pytorch_model-00027-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..40453581830ecc9d90d3887c292811b90e9733ac --- /dev/null +++ b/pytorch_model-00027-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5aa062126e656b7b827317e53fc7107900bb80b4b3fa60b078d030f6ab0173b +size 351296865 diff --git a/pytorch_model-00028-of-00082.bin b/pytorch_model-00028-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..8bc06c4502866ee765ff1742345d92fd8a518579 --- /dev/null +++ b/pytorch_model-00028-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4242a2a58ee759158f020d7164b669b278a82c23eba7c40ba9e25068c2b91ce +size 283116795 diff --git a/pytorch_model-00029-of-00082.bin b/pytorch_model-00029-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..af6d6466b39822a856d10cd7c70edca6cf3c097e --- /dev/null +++ b/pytorch_model-00029-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35008f8ccf2b6700af2f6adcb15b20fac1cd320fec048915613e428ed9599c4d +size 351296865 diff --git a/pytorch_model-00030-of-00082.bin b/pytorch_model-00030-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..008b4aa2912bc378c15b46bafc75976237f22116 --- /dev/null +++ b/pytorch_model-00030-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e1dc8c99a219094b4464fa6c4e7d16de5851ed53b1a94444c6f8045a5ebef9a +size 283116795 diff --git a/pytorch_model-00031-of-00082.bin b/pytorch_model-00031-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..7cc9bc56f8756518d831db4aba9410b35a134347 --- /dev/null +++ b/pytorch_model-00031-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:395f06916d869dd1fa2d419bacc27d75692319b8061206f0bcb0649c597e2415 +size 351296865 diff --git a/pytorch_model-00032-of-00082.bin b/pytorch_model-00032-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..fa184fc30de69e72b83ada5d64de91de9c5af5ee --- /dev/null +++ b/pytorch_model-00032-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d21051227d43ddb58ae705034715939d70ada16a19c8d009003779174b62ad7 +size 283116795 diff --git a/pytorch_model-00033-of-00082.bin b/pytorch_model-00033-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..930a0c4d790533438d5a5db2592c1899d596c191 --- /dev/null +++ b/pytorch_model-00033-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d3d38a5913bbd85dede3751e2117aa5c4b5d28da5721a5e7e1c532440bbecef +size 351296865 diff --git a/pytorch_model-00034-of-00082.bin b/pytorch_model-00034-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..2391de0b4b48b010c30b76ecf93517c2ae2c19d2 --- /dev/null +++ b/pytorch_model-00034-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d881ebfef6c0f21c05c8d19a58dee4715b720f7448041aebd37c95c34d440eda +size 283116795 diff --git a/pytorch_model-00035-of-00082.bin b/pytorch_model-00035-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..8c419300b0fdeadd07c41c599526fa2e42f61637 --- /dev/null +++ b/pytorch_model-00035-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd5dceb63ac732c867e954902be3165dc60478ca2ea3cf4c480ea456e40cbcdb +size 351296865 diff --git a/pytorch_model-00036-of-00082.bin b/pytorch_model-00036-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..323cf0ebb49aac5ce575a1c29f8cbc05c7a2afc9 --- /dev/null +++ b/pytorch_model-00036-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d315936eb49804cd38444850a42a62b6f1190b55fff13d9a8ebd79abe0043045 +size 283116795 diff --git a/pytorch_model-00037-of-00082.bin b/pytorch_model-00037-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..3b5e8ef0d9dcfc7d34e840de1f24ea1f40303574 --- /dev/null +++ b/pytorch_model-00037-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f843b1fb91ee4b68f62f9242d5e9246461bc1e976cf725a0c7521ff80cfb52ae +size 351296865 diff --git a/pytorch_model-00038-of-00082.bin b/pytorch_model-00038-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..0cc5eeb7a99c0672ca99496e44cebbfa40d42b80 --- /dev/null +++ b/pytorch_model-00038-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a48a714ba461c060ef66cd735cf8096b1b097365e9538bde4369250c1f36d044 +size 283116795 diff --git a/pytorch_model-00039-of-00082.bin b/pytorch_model-00039-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..76a8d1f578c85066ba9bdc12012c27cece0c24a2 --- /dev/null +++ b/pytorch_model-00039-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:546bfa5c4f65ae0c72b89f9da21eda017258ba949c5f2d7a59e53dd66aa18caf +size 351296865 diff --git a/pytorch_model-00040-of-00082.bin b/pytorch_model-00040-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..cde7a16ff10c2ef84dd3c07da31bf4ab1b69adc1 --- /dev/null +++ b/pytorch_model-00040-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b776517d136e5f14cb85f31e02a4c63e460d3e2eec62008e7de6ea236825ff51 +size 283116795 diff --git a/pytorch_model-00041-of-00082.bin b/pytorch_model-00041-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..2560c143aea7db837029f42052ea6d0164a422d1 --- /dev/null +++ b/pytorch_model-00041-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:870a46c933f864e5d1faf00b9f3eb708f2e2e71e5ef2c356b9ef06fc7b798435 +size 351296865 diff --git a/pytorch_model-00042-of-00082.bin b/pytorch_model-00042-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..f0a47275068a00ee3447a45ec987f23e22a8e0ca --- /dev/null +++ b/pytorch_model-00042-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b63fe9b47295b20f5c5a60bb36f5a6f6e314ebe57e34a4c430b0da3092179aa4 +size 283116795 diff --git a/pytorch_model-00043-of-00082.bin b/pytorch_model-00043-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..32bde535fdcb79a35a2222f2c1cdc287d8b893f4 --- /dev/null +++ b/pytorch_model-00043-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90341daad8311738c63e10491683703f71301d2fa41d1b3e56d21c4a05102282 +size 351296865 diff --git a/pytorch_model-00044-of-00082.bin b/pytorch_model-00044-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..7a20536dbe8a13b0031d74d8b520d1e863757bfe --- /dev/null +++ b/pytorch_model-00044-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f490f7529120107a27b4967fc45616554d7690ebfef90340bd78afe4f3dfc9c4 +size 283116795 diff --git a/pytorch_model-00045-of-00082.bin b/pytorch_model-00045-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..78339cc3516ec871080de016c5e5399cd71e650e --- /dev/null +++ b/pytorch_model-00045-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa64cf66854887e753c973a208b8d282bdb23ac581976ad490e699ba7de93b24 +size 351296865 diff --git a/pytorch_model-00046-of-00082.bin b/pytorch_model-00046-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..2661ad2b5e66b355dfbaaf0c7a190a792f3fb893 --- /dev/null +++ b/pytorch_model-00046-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:963c52db583c853a94492302ed24175739788a8e506e8f6e10967d1c98fe49e7 +size 283116795 diff --git a/pytorch_model-00047-of-00082.bin b/pytorch_model-00047-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..7805ace0ed71689aa183cfe805f2d98beaeb9a24 --- /dev/null +++ b/pytorch_model-00047-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:003079433b13a8ac31276a8c12fe3c2b8ab1afffd20bd14ab55e83021fa1aacd +size 351296865 diff --git a/pytorch_model-00048-of-00082.bin b/pytorch_model-00048-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..1ebd44f8ab95a2a870c893359c9e2fdb6bb78be2 --- /dev/null +++ b/pytorch_model-00048-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e65b070c829a8a340fc527208e4a86642cbb4bce46c2df9dd3ad2b7dcede1a8 +size 283116795 diff --git a/pytorch_model-00049-of-00082.bin b/pytorch_model-00049-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..2777b0d4185ca960ff246becf3707ef192b53663 --- /dev/null +++ b/pytorch_model-00049-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:704cbbd3d1903d252986c7cdb4ac7f2d3ef98ec164467e03eaee6746f0232435 +size 351296865 diff --git a/pytorch_model-00050-of-00082.bin b/pytorch_model-00050-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..97c0d1b131331958d76d9cf7a06be78d215fa839 --- /dev/null +++ b/pytorch_model-00050-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a450672e6cbd1662afd63d5df8fdc8403b756660924981293a5b8914b1a0098 +size 283116795 diff --git a/pytorch_model-00051-of-00082.bin b/pytorch_model-00051-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..2eafb4c87a738834d9d1700e2e1e787391b83b7b --- /dev/null +++ b/pytorch_model-00051-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:294fcb2f94f4b136b56616db18b079113f80e360592fc8db3adb1652d2073e0c +size 351296865 diff --git a/pytorch_model-00052-of-00082.bin b/pytorch_model-00052-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..68503a1007d7bc2cdc1eaddb559d4f9140e2f661 --- /dev/null +++ b/pytorch_model-00052-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c37f281c2089e5df89852267702e03082654361db15e14eeb499d3f4d0ba641c +size 283116795 diff --git a/pytorch_model-00053-of-00082.bin b/pytorch_model-00053-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..b5ff8b5ed75a8a9e53c59e8ac3b030725933f3d6 --- /dev/null +++ b/pytorch_model-00053-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8979d4783799b88bc8a4e652fded2e0f6340ffd961869d6bca93eb9db08a525 +size 351296865 diff --git a/pytorch_model-00054-of-00082.bin b/pytorch_model-00054-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..d7e6272daa4ee027c0d50beb3ab31ed1ac31b92a --- /dev/null +++ b/pytorch_model-00054-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea497fd39a273ef3548d639029ee5dac5369c9234313ab5adb807e652c7ea88e +size 283116795 diff --git a/pytorch_model-00055-of-00082.bin b/pytorch_model-00055-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..80874e6c7b1fa8057f58c693633712aa18a952c9 --- /dev/null +++ b/pytorch_model-00055-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c0e0290e8ba6d1a0113b1748c560865547b4ab05a3668ce77116cfe4b758200 +size 351296865 diff --git a/pytorch_model-00056-of-00082.bin b/pytorch_model-00056-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..292db6b253b2b8e1575cb6fc6902623ebbba8de7 --- /dev/null +++ b/pytorch_model-00056-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3516e224b00db94be2369cdb79a26252ef59d1035f882494f8eee3a7430803b +size 283116795 diff --git a/pytorch_model-00057-of-00082.bin b/pytorch_model-00057-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..5e55c6cc767102577e9cefc3734a202504b39ae9 --- /dev/null +++ b/pytorch_model-00057-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:126480c4e402c196d3242e20bfe6f9d1224f00a3250e9659880e58944d56890c +size 351296865 diff --git a/pytorch_model-00058-of-00082.bin b/pytorch_model-00058-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..634d5bbbc3480dc3d63d78049f1bd60805f29aa1 --- /dev/null +++ b/pytorch_model-00058-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e0eaef3c37133f5398f5037e8ad0de1590cdd150ac27d5232187f513ff716be +size 283116795 diff --git a/pytorch_model-00059-of-00082.bin b/pytorch_model-00059-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..350a60390dbab014e355166d39f9f29f2d8497d2 --- /dev/null +++ b/pytorch_model-00059-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95781092074a6c04c149f309fa3eeff8d10d4859bcfe5b08b987966dcd1659ed +size 351296865 diff --git a/pytorch_model-00060-of-00082.bin b/pytorch_model-00060-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..59041dae0c8794cd217762dd2fa672cbb700e30b --- /dev/null +++ b/pytorch_model-00060-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cb609dbcf9246c840aad81709f99a941c91a996761770326f6827a2666649f6 +size 283116795 diff --git a/pytorch_model-00061-of-00082.bin b/pytorch_model-00061-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..3b628b574fcc0836c2911373ae29782e1cabe119 --- /dev/null +++ b/pytorch_model-00061-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb510b1aef676267e1b4a5184789972eacf786ca44441352741e711218a34264 +size 351296865 diff --git a/pytorch_model-00062-of-00082.bin b/pytorch_model-00062-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..bcd374814524160180a4d69e7bbbdb981e575aad --- /dev/null +++ b/pytorch_model-00062-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab2404d8f80ec7c0a34d0a68c89ab7921bcfe3822ec0b3fcda57e46708ab6982 +size 283116795 diff --git a/pytorch_model-00063-of-00082.bin b/pytorch_model-00063-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..e136e18069033094dd388abd817dc7a1407fb351 --- /dev/null +++ b/pytorch_model-00063-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d83b3c0d7d957f0ef0ff7eab8cf0a3e12ea84254e28dca2beb6cf146f07ac36 +size 351296865 diff --git a/pytorch_model-00064-of-00082.bin b/pytorch_model-00064-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..9c6b7c399419d69ead21bc3c805991b13119323b --- /dev/null +++ b/pytorch_model-00064-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd16b03bb7c34197619ac71bce209ef1eba87748168a19894b222b6f0ca837de +size 283116795 diff --git a/pytorch_model-00065-of-00082.bin b/pytorch_model-00065-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..3ac669dd656b554a1d8e333d62d10e0946f8b357 --- /dev/null +++ b/pytorch_model-00065-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10e2dc6284ac0bad33e1bd795e619c577accf65f928823f364e7d3ece8ea6b7d +size 351296865 diff --git a/pytorch_model-00066-of-00082.bin b/pytorch_model-00066-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..07f3512e6a4e8b6303618fb87983df0edff6d96e --- /dev/null +++ b/pytorch_model-00066-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:287b0055cd6c213d5537d297f39dee8238a9ac75e90c4ae2cd150b48b01eae37 +size 283116795 diff --git a/pytorch_model-00067-of-00082.bin b/pytorch_model-00067-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..07d91bcc37bf5d9463eb8b5657a6abef3e456bf6 --- /dev/null +++ b/pytorch_model-00067-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1895532303da363c6d80645d6bc8c64376e891b820d742053f60d3ebb5e47c9 +size 351296865 diff --git a/pytorch_model-00068-of-00082.bin b/pytorch_model-00068-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..4e6ab793c98eb3cdb7b7c37d255258b999fd5b66 --- /dev/null +++ b/pytorch_model-00068-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8133dff37c97e3c787b596afcfee9187ccc4f98fc6a049f6ade30667ef0c5dc9 +size 283116795 diff --git a/pytorch_model-00069-of-00082.bin b/pytorch_model-00069-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..f998d3d5b4f361ce0ac4e3ecdb65c734f28b8660 --- /dev/null +++ b/pytorch_model-00069-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f7d5719804f6dc6397d3322869f30017a951e6d5f075b174ad092e8d073a6bf +size 351296865 diff --git a/pytorch_model-00070-of-00082.bin b/pytorch_model-00070-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..b9464b16867821776bb0b78fdc11c1e3e8608e39 --- /dev/null +++ b/pytorch_model-00070-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10f09b9e414918496844673f7028e3be069fd2224d3f15c42b6390399ab9013b +size 283116795 diff --git a/pytorch_model-00071-of-00082.bin b/pytorch_model-00071-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..bcf86927de923619c660251fb36ba4394f873df9 --- /dev/null +++ b/pytorch_model-00071-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dede38e7e936664cee034a2024c31979de3720d97f75f5720799e34b7f1aa6d +size 351296865 diff --git a/pytorch_model-00072-of-00082.bin b/pytorch_model-00072-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..7e5d3eb6ca30f1d22751da7b86eb652c8fc448cb --- /dev/null +++ b/pytorch_model-00072-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87b432946a6195b4f93f0c0c3045f38541c6254e782098bef4cda8c1387989b1 +size 283116795 diff --git a/pytorch_model-00073-of-00082.bin b/pytorch_model-00073-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..eae623b62afdf5d47cc4565a3d67f46811673c07 --- /dev/null +++ b/pytorch_model-00073-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b8c282fe50b9c4c176666f57b8c30aa13c39c253293afac30bbfcc04b331cff +size 351296865 diff --git a/pytorch_model-00074-of-00082.bin b/pytorch_model-00074-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..b8f73ce9cdd14464e71ad4f6e1392cde8debd202 --- /dev/null +++ b/pytorch_model-00074-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:224ea5ebc9d1868d5f40ca08d85c4070542d4be11b3d638893d3e6a9aeeac402 +size 283116795 diff --git a/pytorch_model-00075-of-00082.bin b/pytorch_model-00075-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..b9d737c37a209f495c26b76df33c6a28634c6535 --- /dev/null +++ b/pytorch_model-00075-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d3466c1ae65ea64e28b6e18e03bc7a56c77462670dde0ebd5d5ff39bf543b36 +size 351296865 diff --git a/pytorch_model-00076-of-00082.bin b/pytorch_model-00076-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..976473a25e230e342101b10d577567e06ffb5f38 --- /dev/null +++ b/pytorch_model-00076-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9355f4cdef3c2e54f8da6b5afe4bc229be89492f6a4ea5edeecaadc32441f7c5 +size 283116795 diff --git a/pytorch_model-00077-of-00082.bin b/pytorch_model-00077-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..5707899b96b1b7ebdc17fb59fe3926ad2e46fee8 --- /dev/null +++ b/pytorch_model-00077-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f211856fbd5e15b78e9f2fd7c53411830c85927c0faaa24951c12b8db5cea2c3 +size 351296865 diff --git a/pytorch_model-00078-of-00082.bin b/pytorch_model-00078-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..f8434c1b4df43d646559b7131693a8e943c6c4a2 --- /dev/null +++ b/pytorch_model-00078-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd6e8e8a506ac480b7663483317f9562fdb5b8ffcda6c4442927b40fe614d9bd +size 283116795 diff --git a/pytorch_model-00079-of-00082.bin b/pytorch_model-00079-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..ef4ffa891a4b720c7da7548664e3efa22d6b3d49 --- /dev/null +++ b/pytorch_model-00079-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b4ebb3c715f5828bf0fb6cce4bb60615be5dd9b0e5bf26a928cda249b4ea05c +size 351296865 diff --git a/pytorch_model-00080-of-00082.bin b/pytorch_model-00080-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..fedf94e52ef9bb07e67d0abee14db0b30ab7c86e --- /dev/null +++ b/pytorch_model-00080-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:153c78065e32366f6aaabb34f329a70bbbd6ae0cd668076f6d60230666852a54 +size 283116795 diff --git a/pytorch_model-00081-of-00082.bin b/pytorch_model-00081-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..bf7f1d90cc07a265ad3c78fb8148dc795527930c --- /dev/null +++ b/pytorch_model-00081-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b399e7f129dcdfc92ac850de84974411d115ea8b0bc0cad46923e2400bebdaaf +size 469270301 diff --git a/pytorch_model-00082-of-00082.bin b/pytorch_model-00082-of-00082.bin new file mode 100644 index 0000000000000000000000000000000000000000..aeadcc189df9d810b2dc9587b9fa7da6fa711b3d --- /dev/null +++ b/pytorch_model-00082-of-00082.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97114576d6423820ea4a95b4fbf2f646d519765dc3b7d849363b476254b9a3ba +size 327680938 diff --git a/pytorch_model.bin.index.json b/pytorch_model.bin.index.json new file mode 100644 index 0000000000000000000000000000000000000000..e684cedb1a653453ef5bec1df2994064d057ee48 --- /dev/null +++ b/pytorch_model.bin.index.json @@ -0,0 +1,410 @@ +{ + "metadata": { + "total_size": 26031738880 + }, + "weight_map": { + "lm_head.weight": "pytorch_model-00082-of-00082.bin", + "model.embed_tokens.weight": "pytorch_model-00001-of-00082.bin", + "model.layers.0.input_layernorm.weight": "pytorch_model-00003-of-00082.bin", + "model.layers.0.mlp.down_proj.weight": "pytorch_model-00003-of-00082.bin", + "model.layers.0.mlp.gate_proj.weight": "pytorch_model-00002-of-00082.bin", + "model.layers.0.mlp.up_proj.weight": "pytorch_model-00003-of-00082.bin", + "model.layers.0.post_attention_layernorm.weight": "pytorch_model-00003-of-00082.bin", + "model.layers.0.self_attn.k_proj.weight": "pytorch_model-00002-of-00082.bin", + "model.layers.0.self_attn.o_proj.weight": "pytorch_model-00002-of-00082.bin", + "model.layers.0.self_attn.q_proj.weight": "pytorch_model-00001-of-00082.bin", + "model.layers.0.self_attn.rotary_emb.inv_freq": "pytorch_model-00002-of-00082.bin", + "model.layers.0.self_attn.v_proj.weight": "pytorch_model-00002-of-00082.bin", + "model.layers.1.input_layernorm.weight": "pytorch_model-00005-of-00082.bin", + "model.layers.1.mlp.down_proj.weight": "pytorch_model-00004-of-00082.bin", + "model.layers.1.mlp.gate_proj.weight": "pytorch_model-00004-of-00082.bin", + "model.layers.1.mlp.up_proj.weight": "pytorch_model-00005-of-00082.bin", + "model.layers.1.post_attention_layernorm.weight": "pytorch_model-00005-of-00082.bin", + "model.layers.1.self_attn.k_proj.weight": "pytorch_model-00003-of-00082.bin", + "model.layers.1.self_attn.o_proj.weight": "pytorch_model-00004-of-00082.bin", + "model.layers.1.self_attn.q_proj.weight": "pytorch_model-00003-of-00082.bin", + "model.layers.1.self_attn.rotary_emb.inv_freq": "pytorch_model-00004-of-00082.bin", + "model.layers.1.self_attn.v_proj.weight": "pytorch_model-00004-of-00082.bin", + "model.layers.10.input_layernorm.weight": "pytorch_model-00023-of-00082.bin", + "model.layers.10.mlp.down_proj.weight": "pytorch_model-00022-of-00082.bin", + "model.layers.10.mlp.gate_proj.weight": "pytorch_model-00022-of-00082.bin", + "model.layers.10.mlp.up_proj.weight": "pytorch_model-00023-of-00082.bin", + "model.layers.10.post_attention_layernorm.weight": "pytorch_model-00023-of-00082.bin", + "model.layers.10.self_attn.k_proj.weight": "pytorch_model-00021-of-00082.bin", + "model.layers.10.self_attn.o_proj.weight": "pytorch_model-00021-of-00082.bin", + "model.layers.10.self_attn.q_proj.weight": "pytorch_model-00021-of-00082.bin", + "model.layers.10.self_attn.rotary_emb.inv_freq": "pytorch_model-00021-of-00082.bin", + "model.layers.10.self_attn.v_proj.weight": "pytorch_model-00021-of-00082.bin", + "model.layers.11.input_layernorm.weight": "pytorch_model-00025-of-00082.bin", + "model.layers.11.mlp.down_proj.weight": "pytorch_model-00024-of-00082.bin", + "model.layers.11.mlp.gate_proj.weight": "pytorch_model-00024-of-00082.bin", + "model.layers.11.mlp.up_proj.weight": "pytorch_model-00025-of-00082.bin", + "model.layers.11.post_attention_layernorm.weight": "pytorch_model-00025-of-00082.bin", + "model.layers.11.self_attn.k_proj.weight": "pytorch_model-00023-of-00082.bin", + "model.layers.11.self_attn.o_proj.weight": "pytorch_model-00023-of-00082.bin", + "model.layers.11.self_attn.q_proj.weight": "pytorch_model-00023-of-00082.bin", + "model.layers.11.self_attn.rotary_emb.inv_freq": "pytorch_model-00023-of-00082.bin", + "model.layers.11.self_attn.v_proj.weight": "pytorch_model-00023-of-00082.bin", + "model.layers.12.input_layernorm.weight": "pytorch_model-00027-of-00082.bin", + "model.layers.12.mlp.down_proj.weight": "pytorch_model-00026-of-00082.bin", + "model.layers.12.mlp.gate_proj.weight": "pytorch_model-00026-of-00082.bin", + "model.layers.12.mlp.up_proj.weight": "pytorch_model-00027-of-00082.bin", + "model.layers.12.post_attention_layernorm.weight": "pytorch_model-00027-of-00082.bin", + "model.layers.12.self_attn.k_proj.weight": "pytorch_model-00025-of-00082.bin", + "model.layers.12.self_attn.o_proj.weight": "pytorch_model-00025-of-00082.bin", + "model.layers.12.self_attn.q_proj.weight": "pytorch_model-00025-of-00082.bin", + "model.layers.12.self_attn.rotary_emb.inv_freq": "pytorch_model-00025-of-00082.bin", + "model.layers.12.self_attn.v_proj.weight": "pytorch_model-00025-of-00082.bin", + "model.layers.13.input_layernorm.weight": "pytorch_model-00029-of-00082.bin", + "model.layers.13.mlp.down_proj.weight": "pytorch_model-00028-of-00082.bin", + "model.layers.13.mlp.gate_proj.weight": "pytorch_model-00028-of-00082.bin", + "model.layers.13.mlp.up_proj.weight": "pytorch_model-00029-of-00082.bin", + "model.layers.13.post_attention_layernorm.weight": "pytorch_model-00029-of-00082.bin", + "model.layers.13.self_attn.k_proj.weight": "pytorch_model-00027-of-00082.bin", + "model.layers.13.self_attn.o_proj.weight": "pytorch_model-00027-of-00082.bin", + "model.layers.13.self_attn.q_proj.weight": "pytorch_model-00027-of-00082.bin", + "model.layers.13.self_attn.rotary_emb.inv_freq": "pytorch_model-00027-of-00082.bin", + "model.layers.13.self_attn.v_proj.weight": "pytorch_model-00027-of-00082.bin", + "model.layers.14.input_layernorm.weight": "pytorch_model-00031-of-00082.bin", + "model.layers.14.mlp.down_proj.weight": "pytorch_model-00030-of-00082.bin", + "model.layers.14.mlp.gate_proj.weight": "pytorch_model-00030-of-00082.bin", + "model.layers.14.mlp.up_proj.weight": "pytorch_model-00031-of-00082.bin", + "model.layers.14.post_attention_layernorm.weight": "pytorch_model-00031-of-00082.bin", + "model.layers.14.self_attn.k_proj.weight": "pytorch_model-00029-of-00082.bin", + "model.layers.14.self_attn.o_proj.weight": "pytorch_model-00029-of-00082.bin", + "model.layers.14.self_attn.q_proj.weight": "pytorch_model-00029-of-00082.bin", + "model.layers.14.self_attn.rotary_emb.inv_freq": "pytorch_model-00029-of-00082.bin", + "model.layers.14.self_attn.v_proj.weight": "pytorch_model-00029-of-00082.bin", + "model.layers.15.input_layernorm.weight": "pytorch_model-00033-of-00082.bin", + "model.layers.15.mlp.down_proj.weight": "pytorch_model-00032-of-00082.bin", + "model.layers.15.mlp.gate_proj.weight": "pytorch_model-00032-of-00082.bin", + "model.layers.15.mlp.up_proj.weight": "pytorch_model-00033-of-00082.bin", + "model.layers.15.post_attention_layernorm.weight": "pytorch_model-00033-of-00082.bin", + "model.layers.15.self_attn.k_proj.weight": "pytorch_model-00031-of-00082.bin", + "model.layers.15.self_attn.o_proj.weight": "pytorch_model-00031-of-00082.bin", + "model.layers.15.self_attn.q_proj.weight": "pytorch_model-00031-of-00082.bin", + "model.layers.15.self_attn.rotary_emb.inv_freq": "pytorch_model-00031-of-00082.bin", + "model.layers.15.self_attn.v_proj.weight": "pytorch_model-00031-of-00082.bin", + "model.layers.16.input_layernorm.weight": "pytorch_model-00035-of-00082.bin", + "model.layers.16.mlp.down_proj.weight": "pytorch_model-00034-of-00082.bin", + "model.layers.16.mlp.gate_proj.weight": "pytorch_model-00034-of-00082.bin", + "model.layers.16.mlp.up_proj.weight": "pytorch_model-00035-of-00082.bin", + "model.layers.16.post_attention_layernorm.weight": "pytorch_model-00035-of-00082.bin", + "model.layers.16.self_attn.k_proj.weight": "pytorch_model-00033-of-00082.bin", + "model.layers.16.self_attn.o_proj.weight": "pytorch_model-00033-of-00082.bin", + "model.layers.16.self_attn.q_proj.weight": "pytorch_model-00033-of-00082.bin", + "model.layers.16.self_attn.rotary_emb.inv_freq": "pytorch_model-00033-of-00082.bin", + "model.layers.16.self_attn.v_proj.weight": "pytorch_model-00033-of-00082.bin", + "model.layers.17.input_layernorm.weight": "pytorch_model-00037-of-00082.bin", + "model.layers.17.mlp.down_proj.weight": "pytorch_model-00036-of-00082.bin", + "model.layers.17.mlp.gate_proj.weight": "pytorch_model-00036-of-00082.bin", + "model.layers.17.mlp.up_proj.weight": "pytorch_model-00037-of-00082.bin", + "model.layers.17.post_attention_layernorm.weight": "pytorch_model-00037-of-00082.bin", + "model.layers.17.self_attn.k_proj.weight": "pytorch_model-00035-of-00082.bin", + "model.layers.17.self_attn.o_proj.weight": "pytorch_model-00035-of-00082.bin", + "model.layers.17.self_attn.q_proj.weight": "pytorch_model-00035-of-00082.bin", + "model.layers.17.self_attn.rotary_emb.inv_freq": "pytorch_model-00035-of-00082.bin", + "model.layers.17.self_attn.v_proj.weight": "pytorch_model-00035-of-00082.bin", + "model.layers.18.input_layernorm.weight": "pytorch_model-00039-of-00082.bin", + "model.layers.18.mlp.down_proj.weight": "pytorch_model-00038-of-00082.bin", + "model.layers.18.mlp.gate_proj.weight": "pytorch_model-00038-of-00082.bin", + "model.layers.18.mlp.up_proj.weight": "pytorch_model-00039-of-00082.bin", + "model.layers.18.post_attention_layernorm.weight": "pytorch_model-00039-of-00082.bin", + "model.layers.18.self_attn.k_proj.weight": "pytorch_model-00037-of-00082.bin", + "model.layers.18.self_attn.o_proj.weight": "pytorch_model-00037-of-00082.bin", + "model.layers.18.self_attn.q_proj.weight": "pytorch_model-00037-of-00082.bin", + "model.layers.18.self_attn.rotary_emb.inv_freq": "pytorch_model-00037-of-00082.bin", + "model.layers.18.self_attn.v_proj.weight": "pytorch_model-00037-of-00082.bin", + "model.layers.19.input_layernorm.weight": "pytorch_model-00041-of-00082.bin", + "model.layers.19.mlp.down_proj.weight": "pytorch_model-00040-of-00082.bin", + "model.layers.19.mlp.gate_proj.weight": "pytorch_model-00040-of-00082.bin", + "model.layers.19.mlp.up_proj.weight": "pytorch_model-00041-of-00082.bin", + "model.layers.19.post_attention_layernorm.weight": "pytorch_model-00041-of-00082.bin", + "model.layers.19.self_attn.k_proj.weight": "pytorch_model-00039-of-00082.bin", + "model.layers.19.self_attn.o_proj.weight": "pytorch_model-00039-of-00082.bin", + "model.layers.19.self_attn.q_proj.weight": "pytorch_model-00039-of-00082.bin", + "model.layers.19.self_attn.rotary_emb.inv_freq": "pytorch_model-00039-of-00082.bin", + "model.layers.19.self_attn.v_proj.weight": "pytorch_model-00039-of-00082.bin", + "model.layers.2.input_layernorm.weight": "pytorch_model-00007-of-00082.bin", + "model.layers.2.mlp.down_proj.weight": "pytorch_model-00006-of-00082.bin", + "model.layers.2.mlp.gate_proj.weight": "pytorch_model-00006-of-00082.bin", + "model.layers.2.mlp.up_proj.weight": "pytorch_model-00007-of-00082.bin", + "model.layers.2.post_attention_layernorm.weight": "pytorch_model-00007-of-00082.bin", + "model.layers.2.self_attn.k_proj.weight": "pytorch_model-00005-of-00082.bin", + "model.layers.2.self_attn.o_proj.weight": "pytorch_model-00005-of-00082.bin", + "model.layers.2.self_attn.q_proj.weight": "pytorch_model-00005-of-00082.bin", + "model.layers.2.self_attn.rotary_emb.inv_freq": "pytorch_model-00005-of-00082.bin", + "model.layers.2.self_attn.v_proj.weight": "pytorch_model-00005-of-00082.bin", + "model.layers.20.input_layernorm.weight": "pytorch_model-00043-of-00082.bin", + "model.layers.20.mlp.down_proj.weight": "pytorch_model-00042-of-00082.bin", + "model.layers.20.mlp.gate_proj.weight": "pytorch_model-00042-of-00082.bin", + "model.layers.20.mlp.up_proj.weight": "pytorch_model-00043-of-00082.bin", + "model.layers.20.post_attention_layernorm.weight": "pytorch_model-00043-of-00082.bin", + "model.layers.20.self_attn.k_proj.weight": "pytorch_model-00041-of-00082.bin", + "model.layers.20.self_attn.o_proj.weight": "pytorch_model-00041-of-00082.bin", + "model.layers.20.self_attn.q_proj.weight": "pytorch_model-00041-of-00082.bin", + "model.layers.20.self_attn.rotary_emb.inv_freq": "pytorch_model-00041-of-00082.bin", + "model.layers.20.self_attn.v_proj.weight": "pytorch_model-00041-of-00082.bin", + "model.layers.21.input_layernorm.weight": "pytorch_model-00045-of-00082.bin", + "model.layers.21.mlp.down_proj.weight": "pytorch_model-00044-of-00082.bin", + "model.layers.21.mlp.gate_proj.weight": "pytorch_model-00044-of-00082.bin", + "model.layers.21.mlp.up_proj.weight": "pytorch_model-00045-of-00082.bin", + "model.layers.21.post_attention_layernorm.weight": "pytorch_model-00045-of-00082.bin", + "model.layers.21.self_attn.k_proj.weight": "pytorch_model-00043-of-00082.bin", + "model.layers.21.self_attn.o_proj.weight": "pytorch_model-00043-of-00082.bin", + "model.layers.21.self_attn.q_proj.weight": "pytorch_model-00043-of-00082.bin", + "model.layers.21.self_attn.rotary_emb.inv_freq": "pytorch_model-00043-of-00082.bin", + "model.layers.21.self_attn.v_proj.weight": "pytorch_model-00043-of-00082.bin", + "model.layers.22.input_layernorm.weight": "pytorch_model-00047-of-00082.bin", + "model.layers.22.mlp.down_proj.weight": "pytorch_model-00046-of-00082.bin", + "model.layers.22.mlp.gate_proj.weight": "pytorch_model-00046-of-00082.bin", + "model.layers.22.mlp.up_proj.weight": "pytorch_model-00047-of-00082.bin", + "model.layers.22.post_attention_layernorm.weight": "pytorch_model-00047-of-00082.bin", + "model.layers.22.self_attn.k_proj.weight": "pytorch_model-00045-of-00082.bin", + "model.layers.22.self_attn.o_proj.weight": "pytorch_model-00045-of-00082.bin", + "model.layers.22.self_attn.q_proj.weight": "pytorch_model-00045-of-00082.bin", + "model.layers.22.self_attn.rotary_emb.inv_freq": "pytorch_model-00045-of-00082.bin", + "model.layers.22.self_attn.v_proj.weight": "pytorch_model-00045-of-00082.bin", + "model.layers.23.input_layernorm.weight": "pytorch_model-00049-of-00082.bin", + "model.layers.23.mlp.down_proj.weight": "pytorch_model-00048-of-00082.bin", + "model.layers.23.mlp.gate_proj.weight": "pytorch_model-00048-of-00082.bin", + "model.layers.23.mlp.up_proj.weight": "pytorch_model-00049-of-00082.bin", + "model.layers.23.post_attention_layernorm.weight": "pytorch_model-00049-of-00082.bin", + "model.layers.23.self_attn.k_proj.weight": "pytorch_model-00047-of-00082.bin", + "model.layers.23.self_attn.o_proj.weight": "pytorch_model-00047-of-00082.bin", + "model.layers.23.self_attn.q_proj.weight": "pytorch_model-00047-of-00082.bin", + "model.layers.23.self_attn.rotary_emb.inv_freq": "pytorch_model-00047-of-00082.bin", + "model.layers.23.self_attn.v_proj.weight": "pytorch_model-00047-of-00082.bin", + "model.layers.24.input_layernorm.weight": "pytorch_model-00051-of-00082.bin", + "model.layers.24.mlp.down_proj.weight": "pytorch_model-00050-of-00082.bin", + "model.layers.24.mlp.gate_proj.weight": "pytorch_model-00050-of-00082.bin", + "model.layers.24.mlp.up_proj.weight": "pytorch_model-00051-of-00082.bin", + "model.layers.24.post_attention_layernorm.weight": "pytorch_model-00051-of-00082.bin", + "model.layers.24.self_attn.k_proj.weight": "pytorch_model-00049-of-00082.bin", + "model.layers.24.self_attn.o_proj.weight": "pytorch_model-00049-of-00082.bin", + "model.layers.24.self_attn.q_proj.weight": "pytorch_model-00049-of-00082.bin", + "model.layers.24.self_attn.rotary_emb.inv_freq": "pytorch_model-00049-of-00082.bin", + "model.layers.24.self_attn.v_proj.weight": "pytorch_model-00049-of-00082.bin", + "model.layers.25.input_layernorm.weight": "pytorch_model-00053-of-00082.bin", + "model.layers.25.mlp.down_proj.weight": "pytorch_model-00052-of-00082.bin", + "model.layers.25.mlp.gate_proj.weight": "pytorch_model-00052-of-00082.bin", + "model.layers.25.mlp.up_proj.weight": "pytorch_model-00053-of-00082.bin", + "model.layers.25.post_attention_layernorm.weight": "pytorch_model-00053-of-00082.bin", + "model.layers.25.self_attn.k_proj.weight": "pytorch_model-00051-of-00082.bin", + "model.layers.25.self_attn.o_proj.weight": "pytorch_model-00051-of-00082.bin", + "model.layers.25.self_attn.q_proj.weight": "pytorch_model-00051-of-00082.bin", + "model.layers.25.self_attn.rotary_emb.inv_freq": "pytorch_model-00051-of-00082.bin", + "model.layers.25.self_attn.v_proj.weight": "pytorch_model-00051-of-00082.bin", + "model.layers.26.input_layernorm.weight": "pytorch_model-00055-of-00082.bin", + "model.layers.26.mlp.down_proj.weight": "pytorch_model-00054-of-00082.bin", + "model.layers.26.mlp.gate_proj.weight": "pytorch_model-00054-of-00082.bin", + "model.layers.26.mlp.up_proj.weight": "pytorch_model-00055-of-00082.bin", + "model.layers.26.post_attention_layernorm.weight": "pytorch_model-00055-of-00082.bin", + "model.layers.26.self_attn.k_proj.weight": "pytorch_model-00053-of-00082.bin", + "model.layers.26.self_attn.o_proj.weight": "pytorch_model-00053-of-00082.bin", + "model.layers.26.self_attn.q_proj.weight": "pytorch_model-00053-of-00082.bin", + "model.layers.26.self_attn.rotary_emb.inv_freq": "pytorch_model-00053-of-00082.bin", + "model.layers.26.self_attn.v_proj.weight": "pytorch_model-00053-of-00082.bin", + "model.layers.27.input_layernorm.weight": "pytorch_model-00057-of-00082.bin", + "model.layers.27.mlp.down_proj.weight": "pytorch_model-00056-of-00082.bin", + "model.layers.27.mlp.gate_proj.weight": "pytorch_model-00056-of-00082.bin", + "model.layers.27.mlp.up_proj.weight": "pytorch_model-00057-of-00082.bin", + "model.layers.27.post_attention_layernorm.weight": "pytorch_model-00057-of-00082.bin", + "model.layers.27.self_attn.k_proj.weight": "pytorch_model-00055-of-00082.bin", + "model.layers.27.self_attn.o_proj.weight": "pytorch_model-00055-of-00082.bin", + "model.layers.27.self_attn.q_proj.weight": "pytorch_model-00055-of-00082.bin", + "model.layers.27.self_attn.rotary_emb.inv_freq": "pytorch_model-00055-of-00082.bin", + "model.layers.27.self_attn.v_proj.weight": "pytorch_model-00055-of-00082.bin", + "model.layers.28.input_layernorm.weight": "pytorch_model-00059-of-00082.bin", + "model.layers.28.mlp.down_proj.weight": "pytorch_model-00058-of-00082.bin", + "model.layers.28.mlp.gate_proj.weight": "pytorch_model-00058-of-00082.bin", + "model.layers.28.mlp.up_proj.weight": "pytorch_model-00059-of-00082.bin", + "model.layers.28.post_attention_layernorm.weight": "pytorch_model-00059-of-00082.bin", + "model.layers.28.self_attn.k_proj.weight": "pytorch_model-00057-of-00082.bin", + "model.layers.28.self_attn.o_proj.weight": "pytorch_model-00057-of-00082.bin", + "model.layers.28.self_attn.q_proj.weight": "pytorch_model-00057-of-00082.bin", + "model.layers.28.self_attn.rotary_emb.inv_freq": "pytorch_model-00057-of-00082.bin", + "model.layers.28.self_attn.v_proj.weight": "pytorch_model-00057-of-00082.bin", + "model.layers.29.input_layernorm.weight": "pytorch_model-00061-of-00082.bin", + "model.layers.29.mlp.down_proj.weight": "pytorch_model-00060-of-00082.bin", + "model.layers.29.mlp.gate_proj.weight": "pytorch_model-00060-of-00082.bin", + "model.layers.29.mlp.up_proj.weight": "pytorch_model-00061-of-00082.bin", + "model.layers.29.post_attention_layernorm.weight": "pytorch_model-00061-of-00082.bin", + "model.layers.29.self_attn.k_proj.weight": "pytorch_model-00059-of-00082.bin", + "model.layers.29.self_attn.o_proj.weight": "pytorch_model-00059-of-00082.bin", + "model.layers.29.self_attn.q_proj.weight": "pytorch_model-00059-of-00082.bin", + "model.layers.29.self_attn.rotary_emb.inv_freq": "pytorch_model-00059-of-00082.bin", + "model.layers.29.self_attn.v_proj.weight": "pytorch_model-00059-of-00082.bin", + "model.layers.3.input_layernorm.weight": "pytorch_model-00009-of-00082.bin", + "model.layers.3.mlp.down_proj.weight": "pytorch_model-00008-of-00082.bin", + "model.layers.3.mlp.gate_proj.weight": "pytorch_model-00008-of-00082.bin", + "model.layers.3.mlp.up_proj.weight": "pytorch_model-00009-of-00082.bin", + "model.layers.3.post_attention_layernorm.weight": "pytorch_model-00009-of-00082.bin", + "model.layers.3.self_attn.k_proj.weight": "pytorch_model-00007-of-00082.bin", + "model.layers.3.self_attn.o_proj.weight": "pytorch_model-00007-of-00082.bin", + "model.layers.3.self_attn.q_proj.weight": "pytorch_model-00007-of-00082.bin", + "model.layers.3.self_attn.rotary_emb.inv_freq": "pytorch_model-00007-of-00082.bin", + "model.layers.3.self_attn.v_proj.weight": "pytorch_model-00007-of-00082.bin", + "model.layers.30.input_layernorm.weight": "pytorch_model-00063-of-00082.bin", + "model.layers.30.mlp.down_proj.weight": "pytorch_model-00062-of-00082.bin", + "model.layers.30.mlp.gate_proj.weight": "pytorch_model-00062-of-00082.bin", + "model.layers.30.mlp.up_proj.weight": "pytorch_model-00063-of-00082.bin", + "model.layers.30.post_attention_layernorm.weight": "pytorch_model-00063-of-00082.bin", + "model.layers.30.self_attn.k_proj.weight": "pytorch_model-00061-of-00082.bin", + "model.layers.30.self_attn.o_proj.weight": "pytorch_model-00061-of-00082.bin", + "model.layers.30.self_attn.q_proj.weight": "pytorch_model-00061-of-00082.bin", + "model.layers.30.self_attn.rotary_emb.inv_freq": "pytorch_model-00061-of-00082.bin", + "model.layers.30.self_attn.v_proj.weight": "pytorch_model-00061-of-00082.bin", + "model.layers.31.input_layernorm.weight": "pytorch_model-00065-of-00082.bin", + "model.layers.31.mlp.down_proj.weight": "pytorch_model-00064-of-00082.bin", + "model.layers.31.mlp.gate_proj.weight": "pytorch_model-00064-of-00082.bin", + "model.layers.31.mlp.up_proj.weight": "pytorch_model-00065-of-00082.bin", + "model.layers.31.post_attention_layernorm.weight": "pytorch_model-00065-of-00082.bin", + "model.layers.31.self_attn.k_proj.weight": "pytorch_model-00063-of-00082.bin", + "model.layers.31.self_attn.o_proj.weight": "pytorch_model-00063-of-00082.bin", + "model.layers.31.self_attn.q_proj.weight": "pytorch_model-00063-of-00082.bin", + "model.layers.31.self_attn.rotary_emb.inv_freq": "pytorch_model-00063-of-00082.bin", + "model.layers.31.self_attn.v_proj.weight": "pytorch_model-00063-of-00082.bin", + "model.layers.32.input_layernorm.weight": "pytorch_model-00067-of-00082.bin", + "model.layers.32.mlp.down_proj.weight": "pytorch_model-00066-of-00082.bin", + "model.layers.32.mlp.gate_proj.weight": "pytorch_model-00066-of-00082.bin", + "model.layers.32.mlp.up_proj.weight": "pytorch_model-00067-of-00082.bin", + "model.layers.32.post_attention_layernorm.weight": "pytorch_model-00067-of-00082.bin", + "model.layers.32.self_attn.k_proj.weight": "pytorch_model-00065-of-00082.bin", + "model.layers.32.self_attn.o_proj.weight": "pytorch_model-00065-of-00082.bin", + "model.layers.32.self_attn.q_proj.weight": "pytorch_model-00065-of-00082.bin", + "model.layers.32.self_attn.rotary_emb.inv_freq": "pytorch_model-00065-of-00082.bin", + "model.layers.32.self_attn.v_proj.weight": "pytorch_model-00065-of-00082.bin", + "model.layers.33.input_layernorm.weight": "pytorch_model-00069-of-00082.bin", + "model.layers.33.mlp.down_proj.weight": "pytorch_model-00068-of-00082.bin", + "model.layers.33.mlp.gate_proj.weight": "pytorch_model-00068-of-00082.bin", + "model.layers.33.mlp.up_proj.weight": "pytorch_model-00069-of-00082.bin", + "model.layers.33.post_attention_layernorm.weight": "pytorch_model-00069-of-00082.bin", + "model.layers.33.self_attn.k_proj.weight": "pytorch_model-00067-of-00082.bin", + "model.layers.33.self_attn.o_proj.weight": "pytorch_model-00067-of-00082.bin", + "model.layers.33.self_attn.q_proj.weight": "pytorch_model-00067-of-00082.bin", + "model.layers.33.self_attn.rotary_emb.inv_freq": "pytorch_model-00067-of-00082.bin", + "model.layers.33.self_attn.v_proj.weight": "pytorch_model-00067-of-00082.bin", + "model.layers.34.input_layernorm.weight": "pytorch_model-00071-of-00082.bin", + "model.layers.34.mlp.down_proj.weight": "pytorch_model-00070-of-00082.bin", + "model.layers.34.mlp.gate_proj.weight": "pytorch_model-00070-of-00082.bin", + "model.layers.34.mlp.up_proj.weight": "pytorch_model-00071-of-00082.bin", + "model.layers.34.post_attention_layernorm.weight": "pytorch_model-00071-of-00082.bin", + "model.layers.34.self_attn.k_proj.weight": "pytorch_model-00069-of-00082.bin", + "model.layers.34.self_attn.o_proj.weight": "pytorch_model-00069-of-00082.bin", + "model.layers.34.self_attn.q_proj.weight": "pytorch_model-00069-of-00082.bin", + "model.layers.34.self_attn.rotary_emb.inv_freq": "pytorch_model-00069-of-00082.bin", + "model.layers.34.self_attn.v_proj.weight": "pytorch_model-00069-of-00082.bin", + "model.layers.35.input_layernorm.weight": "pytorch_model-00073-of-00082.bin", + "model.layers.35.mlp.down_proj.weight": "pytorch_model-00072-of-00082.bin", + "model.layers.35.mlp.gate_proj.weight": "pytorch_model-00072-of-00082.bin", + "model.layers.35.mlp.up_proj.weight": "pytorch_model-00073-of-00082.bin", + "model.layers.35.post_attention_layernorm.weight": "pytorch_model-00073-of-00082.bin", + "model.layers.35.self_attn.k_proj.weight": "pytorch_model-00071-of-00082.bin", + "model.layers.35.self_attn.o_proj.weight": "pytorch_model-00071-of-00082.bin", + "model.layers.35.self_attn.q_proj.weight": "pytorch_model-00071-of-00082.bin", + "model.layers.35.self_attn.rotary_emb.inv_freq": "pytorch_model-00071-of-00082.bin", + "model.layers.35.self_attn.v_proj.weight": "pytorch_model-00071-of-00082.bin", + "model.layers.36.input_layernorm.weight": "pytorch_model-00075-of-00082.bin", + "model.layers.36.mlp.down_proj.weight": "pytorch_model-00074-of-00082.bin", + "model.layers.36.mlp.gate_proj.weight": "pytorch_model-00074-of-00082.bin", + "model.layers.36.mlp.up_proj.weight": "pytorch_model-00075-of-00082.bin", + "model.layers.36.post_attention_layernorm.weight": "pytorch_model-00075-of-00082.bin", + "model.layers.36.self_attn.k_proj.weight": "pytorch_model-00073-of-00082.bin", + "model.layers.36.self_attn.o_proj.weight": "pytorch_model-00073-of-00082.bin", + "model.layers.36.self_attn.q_proj.weight": "pytorch_model-00073-of-00082.bin", + "model.layers.36.self_attn.rotary_emb.inv_freq": "pytorch_model-00073-of-00082.bin", + "model.layers.36.self_attn.v_proj.weight": "pytorch_model-00073-of-00082.bin", + "model.layers.37.input_layernorm.weight": "pytorch_model-00077-of-00082.bin", + "model.layers.37.mlp.down_proj.weight": "pytorch_model-00076-of-00082.bin", + "model.layers.37.mlp.gate_proj.weight": "pytorch_model-00076-of-00082.bin", + "model.layers.37.mlp.up_proj.weight": "pytorch_model-00077-of-00082.bin", + "model.layers.37.post_attention_layernorm.weight": "pytorch_model-00077-of-00082.bin", + "model.layers.37.self_attn.k_proj.weight": "pytorch_model-00075-of-00082.bin", + "model.layers.37.self_attn.o_proj.weight": "pytorch_model-00075-of-00082.bin", + "model.layers.37.self_attn.q_proj.weight": "pytorch_model-00075-of-00082.bin", + "model.layers.37.self_attn.rotary_emb.inv_freq": "pytorch_model-00075-of-00082.bin", + "model.layers.37.self_attn.v_proj.weight": "pytorch_model-00075-of-00082.bin", + "model.layers.38.input_layernorm.weight": "pytorch_model-00079-of-00082.bin", + "model.layers.38.mlp.down_proj.weight": "pytorch_model-00078-of-00082.bin", + "model.layers.38.mlp.gate_proj.weight": "pytorch_model-00078-of-00082.bin", + "model.layers.38.mlp.up_proj.weight": "pytorch_model-00079-of-00082.bin", + "model.layers.38.post_attention_layernorm.weight": "pytorch_model-00079-of-00082.bin", + "model.layers.38.self_attn.k_proj.weight": "pytorch_model-00077-of-00082.bin", + "model.layers.38.self_attn.o_proj.weight": "pytorch_model-00077-of-00082.bin", + "model.layers.38.self_attn.q_proj.weight": "pytorch_model-00077-of-00082.bin", + "model.layers.38.self_attn.rotary_emb.inv_freq": "pytorch_model-00077-of-00082.bin", + "model.layers.38.self_attn.v_proj.weight": "pytorch_model-00077-of-00082.bin", + "model.layers.39.input_layernorm.weight": "pytorch_model-00081-of-00082.bin", + "model.layers.39.mlp.down_proj.weight": "pytorch_model-00080-of-00082.bin", + "model.layers.39.mlp.gate_proj.weight": "pytorch_model-00080-of-00082.bin", + "model.layers.39.mlp.up_proj.weight": "pytorch_model-00081-of-00082.bin", + "model.layers.39.post_attention_layernorm.weight": "pytorch_model-00081-of-00082.bin", + "model.layers.39.self_attn.k_proj.weight": "pytorch_model-00079-of-00082.bin", + "model.layers.39.self_attn.o_proj.weight": "pytorch_model-00079-of-00082.bin", + "model.layers.39.self_attn.q_proj.weight": "pytorch_model-00079-of-00082.bin", + "model.layers.39.self_attn.rotary_emb.inv_freq": "pytorch_model-00079-of-00082.bin", + "model.layers.39.self_attn.v_proj.weight": "pytorch_model-00079-of-00082.bin", + "model.layers.4.input_layernorm.weight": "pytorch_model-00011-of-00082.bin", + "model.layers.4.mlp.down_proj.weight": "pytorch_model-00010-of-00082.bin", + "model.layers.4.mlp.gate_proj.weight": "pytorch_model-00010-of-00082.bin", + "model.layers.4.mlp.up_proj.weight": "pytorch_model-00011-of-00082.bin", + "model.layers.4.post_attention_layernorm.weight": "pytorch_model-00011-of-00082.bin", + "model.layers.4.self_attn.k_proj.weight": "pytorch_model-00009-of-00082.bin", + "model.layers.4.self_attn.o_proj.weight": "pytorch_model-00009-of-00082.bin", + "model.layers.4.self_attn.q_proj.weight": "pytorch_model-00009-of-00082.bin", + "model.layers.4.self_attn.rotary_emb.inv_freq": "pytorch_model-00009-of-00082.bin", + "model.layers.4.self_attn.v_proj.weight": "pytorch_model-00009-of-00082.bin", + "model.layers.5.input_layernorm.weight": "pytorch_model-00013-of-00082.bin", + "model.layers.5.mlp.down_proj.weight": "pytorch_model-00012-of-00082.bin", + "model.layers.5.mlp.gate_proj.weight": "pytorch_model-00012-of-00082.bin", + "model.layers.5.mlp.up_proj.weight": "pytorch_model-00013-of-00082.bin", + "model.layers.5.post_attention_layernorm.weight": "pytorch_model-00013-of-00082.bin", + "model.layers.5.self_attn.k_proj.weight": "pytorch_model-00011-of-00082.bin", + "model.layers.5.self_attn.o_proj.weight": "pytorch_model-00011-of-00082.bin", + "model.layers.5.self_attn.q_proj.weight": "pytorch_model-00011-of-00082.bin", + "model.layers.5.self_attn.rotary_emb.inv_freq": "pytorch_model-00011-of-00082.bin", + "model.layers.5.self_attn.v_proj.weight": "pytorch_model-00011-of-00082.bin", + "model.layers.6.input_layernorm.weight": "pytorch_model-00015-of-00082.bin", + "model.layers.6.mlp.down_proj.weight": "pytorch_model-00014-of-00082.bin", + "model.layers.6.mlp.gate_proj.weight": "pytorch_model-00014-of-00082.bin", + "model.layers.6.mlp.up_proj.weight": "pytorch_model-00015-of-00082.bin", + "model.layers.6.post_attention_layernorm.weight": "pytorch_model-00015-of-00082.bin", + "model.layers.6.self_attn.k_proj.weight": "pytorch_model-00013-of-00082.bin", + "model.layers.6.self_attn.o_proj.weight": "pytorch_model-00013-of-00082.bin", + "model.layers.6.self_attn.q_proj.weight": "pytorch_model-00013-of-00082.bin", + "model.layers.6.self_attn.rotary_emb.inv_freq": "pytorch_model-00013-of-00082.bin", + "model.layers.6.self_attn.v_proj.weight": "pytorch_model-00013-of-00082.bin", + "model.layers.7.input_layernorm.weight": "pytorch_model-00017-of-00082.bin", + "model.layers.7.mlp.down_proj.weight": "pytorch_model-00016-of-00082.bin", + "model.layers.7.mlp.gate_proj.weight": "pytorch_model-00016-of-00082.bin", + "model.layers.7.mlp.up_proj.weight": "pytorch_model-00017-of-00082.bin", + "model.layers.7.post_attention_layernorm.weight": "pytorch_model-00017-of-00082.bin", + "model.layers.7.self_attn.k_proj.weight": "pytorch_model-00015-of-00082.bin", + "model.layers.7.self_attn.o_proj.weight": "pytorch_model-00015-of-00082.bin", + "model.layers.7.self_attn.q_proj.weight": "pytorch_model-00015-of-00082.bin", + "model.layers.7.self_attn.rotary_emb.inv_freq": "pytorch_model-00015-of-00082.bin", + "model.layers.7.self_attn.v_proj.weight": "pytorch_model-00015-of-00082.bin", + "model.layers.8.input_layernorm.weight": "pytorch_model-00019-of-00082.bin", + "model.layers.8.mlp.down_proj.weight": "pytorch_model-00018-of-00082.bin", + "model.layers.8.mlp.gate_proj.weight": "pytorch_model-00018-of-00082.bin", + "model.layers.8.mlp.up_proj.weight": "pytorch_model-00019-of-00082.bin", + "model.layers.8.post_attention_layernorm.weight": "pytorch_model-00019-of-00082.bin", + "model.layers.8.self_attn.k_proj.weight": "pytorch_model-00017-of-00082.bin", + "model.layers.8.self_attn.o_proj.weight": "pytorch_model-00017-of-00082.bin", + "model.layers.8.self_attn.q_proj.weight": "pytorch_model-00017-of-00082.bin", + "model.layers.8.self_attn.rotary_emb.inv_freq": "pytorch_model-00017-of-00082.bin", + "model.layers.8.self_attn.v_proj.weight": "pytorch_model-00017-of-00082.bin", + "model.layers.9.input_layernorm.weight": "pytorch_model-00021-of-00082.bin", + "model.layers.9.mlp.down_proj.weight": "pytorch_model-00020-of-00082.bin", + "model.layers.9.mlp.gate_proj.weight": "pytorch_model-00020-of-00082.bin", + "model.layers.9.mlp.up_proj.weight": "pytorch_model-00021-of-00082.bin", + "model.layers.9.post_attention_layernorm.weight": "pytorch_model-00021-of-00082.bin", + "model.layers.9.self_attn.k_proj.weight": "pytorch_model-00019-of-00082.bin", + "model.layers.9.self_attn.o_proj.weight": "pytorch_model-00019-of-00082.bin", + "model.layers.9.self_attn.q_proj.weight": "pytorch_model-00019-of-00082.bin", + "model.layers.9.self_attn.rotary_emb.inv_freq": "pytorch_model-00019-of-00082.bin", + "model.layers.9.self_attn.v_proj.weight": "pytorch_model-00019-of-00082.bin", + "model.norm.weight": "pytorch_model-00081-of-00082.bin" + } +}