diff --git a/.gitattributes b/.gitattributes index a6344aac8c09253b3b630fb776ae94478aa0275b..52373fe24473b1aa44333d318f578ae6bf04b49b 100644 --- a/.gitattributes +++ b/.gitattributes @@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text *.zip filter=lfs diff=lfs merge=lfs -text *.zst filter=lfs diff=lfs merge=lfs -text *tfevents* filter=lfs diff=lfs merge=lfs -text +tokenizer.json filter=lfs diff=lfs merge=lfs -text diff --git a/config.json b/config.json new file mode 100644 index 0000000000000000000000000000000000000000..82f5e0aafc3f20384a827dc4ff8e919f02dc3756 --- /dev/null +++ b/config.json @@ -0,0 +1,36 @@ +{ + "_name_or_path": "/oe-adapt-default/costah/models/405B_finetune_successful", + "architectures": [ + "LlamaForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "bos_token_id": 128000, + "eos_token_id": 128001, + "head_dim": 128, + "hidden_act": "silu", + "hidden_size": 16384, + "initializer_range": 0.02, + "intermediate_size": 53248, + "max_position_embeddings": 131072, + "mlp_bias": false, + "model_type": "llama", + "num_attention_heads": 128, + "num_hidden_layers": 126, + "num_key_value_heads": 8, + "pretraining_tp": 1, + "rms_norm_eps": 1e-05, + "rope_scaling": { + "factor": 8.0, + "high_freq_factor": 4.0, + "low_freq_factor": 1.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3" + }, + "rope_theta": 500000.0, + "tie_word_embeddings": false, + "torch_dtype": "bfloat16", + "transformers_version": "4.47.1", + "use_cache": true, + "vocab_size": 128264 +} diff --git a/generation_config.json b/generation_config.json new file mode 100644 index 0000000000000000000000000000000000000000..41de1af1b10386ca8193ae61bdb014263a2402e1 --- /dev/null +++ b/generation_config.json @@ -0,0 +1,9 @@ +{ + "_from_model_config": true, + "bos_token_id": 128000, + "do_sample": true, + "eos_token_id": 128001, + "temperature": 0.6, + "top_p": 0.9, + "transformers_version": "4.47.1" +} diff --git a/metadata.json b/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..4f3699b1ad213bccfdfb47b510140b4a8838444c --- /dev/null +++ b/metadata.json @@ -0,0 +1 @@ +{"model_name": "dpo_tune_cache", "model_type": "dpo", "datasets": ["ai2-adapt-dev/405b_preference_mix"], "base_model": "/oe-adapt-default/costah/models/405B_finetune_successful", "wandb_path": "https://wandb.ai/ai2-llm/open_instruct_internal/runs/v1rhfn1m", "beaker_experiment": "https://beaker.org/ex/01JJ4QRZ31SH79AHVM6WWDVJB4/", "beaker_datasets": ["https://beaker.org/ds/01JJ4QRZ4X8RKSGP939745BWPP", "https://beaker.org/ds/01JJ4QRZA364S625K42YEJC471", "https://beaker.org/ds/01JJ4QRZF5AKF5JXS7G79CTWXH", "https://beaker.org/ds/01JJ4QRZMBXP67FBN3MKYB90M8", "https://beaker.org/ds/01JJ4QRZT9PHZ1TD216TKNZ0C0", "https://beaker.org/ds/01JJ4QS000A3V672TFZHRBCSFE", "https://beaker.org/ds/01JJ4QS04TZM482VA9A9QV04H5", "https://beaker.org/ds/01JJ4QS09J57HA4XP2TAYJMBHY", "https://beaker.org/ds/01JJ4QS0F18PHA5Y44W1TCTK1N", "https://beaker.org/ds/01JJ4QS0KZK07C8JKQQ39JZADN", "https://beaker.org/ds/01JJ4QS0STGPH2151E331EWJR7", "https://beaker.org/ds/01JJ4QS0Z26WZD9131ZTDMCSM7", "https://beaker.org/ds/01JJ4QS157W1A3J9VD2WYX7DRN", "https://beaker.org/ds/01JJ4QS1BVQKR41YH4G5JC9NQ3", "https://beaker.org/ds/01JJ4QS1H1KM8XBQXWAR3RCTXA", "https://beaker.org/ds/01JJ4QS1Q0TS69T26BTETH3MTH", "https://beaker.org/ds/01JJ4QS1W1QEES6EQMK4RHA5S8", "https://beaker.org/ds/01JJ4QS213SH8VF4CYWKHKCGF0", "https://beaker.org/ds/01JJ4QS25TY2JCKAK423RHYCWX", "https://beaker.org/ds/01JJ4QS2AN2XMTDDTEMTYGNPAC", "https://beaker.org/ds/01JJ4QS2FMJTDNSPXW953KS7VB", "https://beaker.org/ds/01JJ4QS2N7K26FJZXJ9QE6A9X2", "https://beaker.org/ds/01JJ4QS2T9TW1ZZT1E5TWYZP4D", "https://beaker.org/ds/01JJ4QS2Z8HPSPAT47TCH4VK6A", "https://beaker.org/ds/01JJ4QS346VN1D1Y67GAAX5TC7", "https://beaker.org/ds/01JJ4QS391HH9PVZMZZC1GSGSY", "https://beaker.org/ds/01JJ4QS3E2NSTJ2XF2R5VQFF7M", "https://beaker.org/ds/01JJ4QS3K0V50J4FNVPQZRA74K", "https://beaker.org/ds/01JJ4QS3QTH2CQM8ERMKTFC8H2", "https://beaker.org/ds/01JJ4QS3WS89MVZRK50NE3WRM2", "https://beaker.org/ds/01JJ4QS41QJ2CSVZQJE0KHC75X", "https://beaker.org/ds/01JJ4QS46SGE41SRG0XYQ6TY63"]} \ No newline at end of file diff --git a/pytorch_model-00001-of-00191.bin b/pytorch_model-00001-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..e7f13ab92d7b9624ca3ddc2e885bf7aabb8bce21 --- /dev/null +++ b/pytorch_model-00001-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf2e1c55a115e9bf0b130ead654afad71b768b775ba1a05378d2c0d3ab3a1618 +size 4806936944 diff --git a/pytorch_model-00002-of-00191.bin b/pytorch_model-00002-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..f49099f59ada95b457f5ff11439c719265043dc2 --- /dev/null +++ b/pytorch_model-00002-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41d00ad652a37a9bedc0d483688bf65f69e293df8842056ca53ab46978fc476d +size 4026533863 diff --git a/pytorch_model-00004-of-00191.bin b/pytorch_model-00004-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..f7881b136973377004e8d270f5164536ea8e32b4 --- /dev/null +++ b/pytorch_model-00004-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0756f79c6675ed23fcf171c49489a14375139a758a3464b7d9f42877855eefa +size 4630580764 diff --git a/pytorch_model-00005-of-00191.bin b/pytorch_model-00005-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..629b2d67ee9c89722969dbd2e87b68685000dbf5 --- /dev/null +++ b/pytorch_model-00005-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4311d860602a353eb2ba3b8729cfea97a1ba353606a277a4a088942f6be6749 +size 3489662678 diff --git a/pytorch_model-00006-of-00191.bin b/pytorch_model-00006-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..209eb835935bb5169f5a7ab6ce802e7ad25fef06 --- /dev/null +++ b/pytorch_model-00006-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f8c7cd3715c92da69508e3fc7ef211ffb9320176c24154481afe75c1643c196 +size 4630580764 diff --git a/pytorch_model-00007-of-00191.bin b/pytorch_model-00007-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..de7e3a7dee1d61830740eb5187a83126dc375846 --- /dev/null +++ b/pytorch_model-00007-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12e4642c4594b880e48d1a5d4b933f487f549bb73b32522d4b91b71e2a4c52e3 +size 4630580764 diff --git a/pytorch_model-00009-of-00191.bin b/pytorch_model-00009-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..c806710b1a2285980e01a31fd9d6a2b1aed8f4a7 --- /dev/null +++ b/pytorch_model-00009-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2138106cb4a6c264e5017510adfa2960b684f9d6d023353bf75ac3e4a796db69 +size 4630580764 diff --git a/pytorch_model-00010-of-00191.bin b/pytorch_model-00010-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..44be3e8ff05fd5b3220a57156d3bfac3aa0c0d95 --- /dev/null +++ b/pytorch_model-00010-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a64bb8fb16aa2c6a04776fa15fdccdd70c773a59e87882a1b361703b7275ba2 +size 4630580764 diff --git a/pytorch_model-00011-of-00191.bin b/pytorch_model-00011-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..726ee8c5057840b37bc130775b82637d74d6a40f --- /dev/null +++ b/pytorch_model-00011-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab5b34a0d4db6b0ee8b1ce33e57eefaa358e4fbe6f19394af76a8a3dcc23b7e7 +size 3489662678 diff --git a/pytorch_model-00012-of-00191.bin b/pytorch_model-00012-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..fb725ad6d37b861f8612df211038c64e97f47fbb --- /dev/null +++ b/pytorch_model-00012-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbe45e6274d71626231412097a292e50adbb587785dce0e6147f47f834367901 +size 4630580764 diff --git a/pytorch_model-00013-of-00191.bin b/pytorch_model-00013-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..7757b72d8869dfc9ed61024d351dfd9c03e12a2a --- /dev/null +++ b/pytorch_model-00013-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdc3cafdf2601dfd2d7f153c06053f08fa0b130232d8c3b0d33e34d992e6c2e3 +size 4630580764 diff --git a/pytorch_model-00014-of-00191.bin b/pytorch_model-00014-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..b69e88778a7c8dcc8f1a487d015b250a27fea1e5 --- /dev/null +++ b/pytorch_model-00014-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:726a80237b9b945e46a5d762b144500bc2a37bcb1a9c8a97b28b387aa8b7f63c +size 3489662678 diff --git a/pytorch_model-00015-of-00191.bin b/pytorch_model-00015-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..fa17723d9804250eb5ae2aaae694ca4d9f7bd844 --- /dev/null +++ b/pytorch_model-00015-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5eb54ddb4b3a5d64b8394d3adc94bc1cc63ca115cf3ff2cc9e0d421b3b2a4bf +size 4630580764 diff --git a/pytorch_model-00019-of-00191.bin b/pytorch_model-00019-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..08d20455634debcbe1e2a87f789591c412f68549 --- /dev/null +++ b/pytorch_model-00019-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ea003813af99a76b754d215274f41bd6967b5c195000ccf321ef6438eb253c6 +size 4630580764 diff --git a/pytorch_model-00020-of-00191.bin b/pytorch_model-00020-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..993c0417d96af5f9410d8c991408bf01131226d1 --- /dev/null +++ b/pytorch_model-00020-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d261ca85e50871964f3b00925f9c8135a475c91157159dcbef6b4ae91570eb9 +size 3489662678 diff --git a/pytorch_model-00022-of-00191.bin b/pytorch_model-00022-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..f0eb617b94c271a36ceffca8f62ca662b9c829f7 --- /dev/null +++ b/pytorch_model-00022-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16f68f15c2a98eb49e7b3d9e42473778b558347a4a509c3a1b752af2fd16de47 +size 4630580764 diff --git a/pytorch_model-00023-of-00191.bin b/pytorch_model-00023-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..8dfa2832a4b2a7234939b11df9f165edcef40cca --- /dev/null +++ b/pytorch_model-00023-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b669b9f7388bc28e9e3223d96901e69d586fd90bac6f7834c6cfb82c713a2acf +size 3489662678 diff --git a/pytorch_model-00024-of-00191.bin b/pytorch_model-00024-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..9af4a330a6f1e80b587b55808d8e2b14b3c5f471 --- /dev/null +++ b/pytorch_model-00024-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:970949fe23424bc3af8c62e0d46439a0cb09fc1974f9f1ee0db355d7122d4d11 +size 4630580764 diff --git a/pytorch_model-00025-of-00191.bin b/pytorch_model-00025-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..fb9e3c9ac7f866c766c1fdd6f774412431bfdcb5 --- /dev/null +++ b/pytorch_model-00025-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0f9dde38b78e02a346d828c1bfadd6cc477536561a42ed8c674041de0bf0fce +size 4630580764 diff --git a/pytorch_model-00026-of-00191.bin b/pytorch_model-00026-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..f027dfd440237dd4f00393c9388d2f78afa019ee --- /dev/null +++ b/pytorch_model-00026-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbf925bc9b7935acda05d4d8ec27cc42ffe6e2a24f9c21594ae31b7e0f5dca78 +size 3489662678 diff --git a/pytorch_model-00027-of-00191.bin b/pytorch_model-00027-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..da75b41f9889d6d906155b22ec5013cb16e28f76 --- /dev/null +++ b/pytorch_model-00027-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e81223042ce073e05edf45f6deecab302fd2eab92f8b2d4ec07d3b6805ce7072 +size 4630580764 diff --git a/pytorch_model-00028-of-00191.bin b/pytorch_model-00028-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..d3381c9edeac62002bfa5330d1b7fcdf9090bd36 --- /dev/null +++ b/pytorch_model-00028-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c93d6abaa734fdc04e1f1e863442d647191f538102c0990840678bd12766387 +size 4630580764 diff --git a/pytorch_model-00029-of-00191.bin b/pytorch_model-00029-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..a44d4e7bfb064e27579d50d7705352dec9f76f56 --- /dev/null +++ b/pytorch_model-00029-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d715dd48b381d0c657be234d775309884d7145917202f1dd9ae2e2cf1fe59adb +size 3489662678 diff --git a/pytorch_model-00030-of-00191.bin b/pytorch_model-00030-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..bff9933b24cdda2ac390ac2f0d5efe7eabaefdb5 --- /dev/null +++ b/pytorch_model-00030-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09a62e9f2f3c095d483ec7c9bd72d8005b3e8b7f0792aaf56e779eaedb6a8ce6 +size 4630580764 diff --git a/pytorch_model-00031-of-00191.bin b/pytorch_model-00031-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..b91d48b2bfec20b87cf65322cf50180ba146ad83 --- /dev/null +++ b/pytorch_model-00031-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c04437c59a1e8ac05ed521d218048f2973aacacdf7beffb34b2b474c0bf6cc18 +size 4630580764 diff --git a/pytorch_model-00032-of-00191.bin b/pytorch_model-00032-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..2c5310346b81b63e8ad0a7ad1c21d4f824c6c8ef --- /dev/null +++ b/pytorch_model-00032-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:528606b66c020948a4c2a9c0ca9b1e8b1ac3f6f4da9ccc04b55f760a4ad5817e +size 3489662678 diff --git a/pytorch_model-00034-of-00191.bin b/pytorch_model-00034-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..7038f580fbff9da7a4f2c61ab90b6c84a9107ffd --- /dev/null +++ b/pytorch_model-00034-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:608be02773ec1d3d70f37743fe63c6ecea2bdd7b6854ee605e8db2805bbfa955 +size 4630580764 diff --git a/pytorch_model-00035-of-00191.bin b/pytorch_model-00035-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..d5f6d9c0a4ed84ebe4c79f649f3fac77c8d08972 --- /dev/null +++ b/pytorch_model-00035-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5692b5cf6b8cc8298637519e1424555ff2adfdedadd093f0bcc0b3241e1c1b1d +size 3489662678 diff --git a/pytorch_model-00036-of-00191.bin b/pytorch_model-00036-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..65f5b5977b5cc04f3d11d7ea4943385df1a956ec --- /dev/null +++ b/pytorch_model-00036-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ddbd672d526b6af200fb8fbc05165e75cd05b8f2e205acc6d7851b08fd6f68d +size 4630580764 diff --git a/pytorch_model-00037-of-00191.bin b/pytorch_model-00037-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..e64148fad005b69b8a2ec2ca890be076319f258a --- /dev/null +++ b/pytorch_model-00037-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17f34357c32670c97c6eb57e36c3222d43d959346e53c0b1f147265ff40a2a62 +size 4630580764 diff --git a/pytorch_model-00038-of-00191.bin b/pytorch_model-00038-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..46234a831c02a83fc7cc3c0d78675a356f245ad7 --- /dev/null +++ b/pytorch_model-00038-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a87c119ab700c934d26908869000a0d83dd786a02b92c7751c8ae4f943dcc841 +size 3489662678 diff --git a/pytorch_model-00039-of-00191.bin b/pytorch_model-00039-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..05c7fa4e0e2f801a27c0da25e861d550b60f0469 --- /dev/null +++ b/pytorch_model-00039-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3876548388777f52ea7dbf3a2e513f2f140e2f7cd1def3e2be612a24e9e4ffaf +size 4630580764 diff --git a/pytorch_model-00040-of-00191.bin b/pytorch_model-00040-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..249eacf6389002758a8bc82408860f0f3bead1a2 --- /dev/null +++ b/pytorch_model-00040-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38b5b3c9569f7c7d285b25b44a8fff9e210f8018d3ed72db9de8d502923c6bd1 +size 4630580764 diff --git a/pytorch_model-00041-of-00191.bin b/pytorch_model-00041-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..d1e4a5b0f6e6d5f2bff9c9af78d52fdda2aac767 --- /dev/null +++ b/pytorch_model-00041-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b778bace05ca621c3ac006b9c22953546078181524708efd1097c733d55cbca6 +size 3489662678 diff --git a/pytorch_model-00044-of-00191.bin b/pytorch_model-00044-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..9f3c3125da424fc8fb7b7f0ee85723884b2ac166 --- /dev/null +++ b/pytorch_model-00044-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5365eb67d76a5f907a26556de48f3cdfb9aa2158ab0b265582ead7535e823ab +size 3489662678 diff --git a/pytorch_model-00046-of-00191.bin b/pytorch_model-00046-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..1f15b02da7af3f79f5fee80411ca60e982d6380f --- /dev/null +++ b/pytorch_model-00046-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:760b07e00973ccf38e9b384eb8835dc93f2f68c2713a0fb3dc479e548d47c4bb +size 4630580764 diff --git a/pytorch_model-00047-of-00191.bin b/pytorch_model-00047-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..73c01454d3a65364b9e80cfdce03a9ab4820ad8c --- /dev/null +++ b/pytorch_model-00047-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96610c0c7c300ca77e2dbfb20366ca363aa0b7b015be5e118d191420d7527758 +size 3489662678 diff --git a/pytorch_model-00048-of-00191.bin b/pytorch_model-00048-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..3920305ee28742198a88d6dc044afe9cdea9d5eb --- /dev/null +++ b/pytorch_model-00048-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b391de2d50d08c9f39fad63fd7568c47898a83420a90856ebde6a92a0cedfe5 +size 4630580764 diff --git a/pytorch_model-00049-of-00191.bin b/pytorch_model-00049-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..08b2469f259f0564ee8b02449983ba0d18a1f503 --- /dev/null +++ b/pytorch_model-00049-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75163f3075a0fc1a3b35e4b936d8b1228a0137d0bc389eb862567fd7701584a4 +size 4630580764 diff --git a/pytorch_model-00050-of-00191.bin b/pytorch_model-00050-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..b0716ef658f5d956b58a6e9159344f8d7679dbcd --- /dev/null +++ b/pytorch_model-00050-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d1267940808131c25f245150994ad530ab62415d0a6d6c2d518700073b793b5 +size 3489662678 diff --git a/pytorch_model-00051-of-00191.bin b/pytorch_model-00051-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..a19530d8b124ccb20774cfefdb99b300ec2b8c9a --- /dev/null +++ b/pytorch_model-00051-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d234755c451728060a4bd4ee790646826e5702ac9bed38fe6530e419f0133121 +size 4630580764 diff --git a/pytorch_model-00054-of-00191.bin b/pytorch_model-00054-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..0f6d31d747f6a650c1f44b67aa15abed32f20dc4 --- /dev/null +++ b/pytorch_model-00054-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c298c52d93a8fe4006fc02e9a1d670f74163c3a9c968d71c8c6db7005a02faf +size 4630580764 diff --git a/pytorch_model-00055-of-00191.bin b/pytorch_model-00055-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..b3b4849c43e818678a87374dbfa0a8248b4de1c8 --- /dev/null +++ b/pytorch_model-00055-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcd2a3695cac6af9b5deef7793e45e0f6492264a1b8a7cc16e3426bd50582dab +size 4630580764 diff --git a/pytorch_model-00056-of-00191.bin b/pytorch_model-00056-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..21223491ad880e4dac9eae0e2d03485dd9cbbd24 --- /dev/null +++ b/pytorch_model-00056-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0dc841bb02a948c5a857a5782cabe00b70fe4b4ab79d008ba1e34fb698dce7be +size 3489662678 diff --git a/pytorch_model-00057-of-00191.bin b/pytorch_model-00057-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..2eb5cf03a703f7e00c64fcf297443cff5ae62121 --- /dev/null +++ b/pytorch_model-00057-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f91db550d033a9bfed60e7c8a0b46722b943acc579d408599498210b562f82e0 +size 4630580764 diff --git a/pytorch_model-00058-of-00191.bin b/pytorch_model-00058-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..a93f171e617ef7655be19b49aab0b2ab62f6e050 --- /dev/null +++ b/pytorch_model-00058-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b82f39bc4cfce7039562b07229f39edb08c6519999b52fd6db8af3a5b9743c4f +size 4630580764 diff --git a/pytorch_model-00059-of-00191.bin b/pytorch_model-00059-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..daf1faa95761bb5a493f74e8b73f3e8e5d40268d --- /dev/null +++ b/pytorch_model-00059-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40a04c30c190d4af143728976872d1e5295d054ffb489f759592a6bd4682b903 +size 3489662678 diff --git a/pytorch_model-00061-of-00191.bin b/pytorch_model-00061-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..9815a5bab513f92d68680c278a838d103484ef6a --- /dev/null +++ b/pytorch_model-00061-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2df42ade4698fbbd9b20dbe0ea3d67f09cffd5656afc4ba89eb13ea98b66ad59 +size 4630580764 diff --git a/pytorch_model-00062-of-00191.bin b/pytorch_model-00062-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..058dbe3b0f8190106522f1ec598cfab0e395ebe4 --- /dev/null +++ b/pytorch_model-00062-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e3e37c6517980e314004b7be85227a534b398185c6da2e034d34d2c909839e1 +size 3489662678 diff --git a/pytorch_model-00063-of-00191.bin b/pytorch_model-00063-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..fd45cafe85eaacd2dba38d3849790f1c80929d17 --- /dev/null +++ b/pytorch_model-00063-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ed18f13327a3339a299901fa74099f200f6249c01f62bef6485c09d99374c82 +size 4630580764 diff --git a/pytorch_model-00064-of-00191.bin b/pytorch_model-00064-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..5fdaf7dec9156c4d313dbce60e84d696dca83f8d --- /dev/null +++ b/pytorch_model-00064-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bac8233a307f287e44f5034c15edfa18a7ceb298ea2949510294fc5676fe0df5 +size 4630580764 diff --git a/pytorch_model-00065-of-00191.bin b/pytorch_model-00065-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..0bee932c40d2d0973302ef2d1a2382d64a7206d8 --- /dev/null +++ b/pytorch_model-00065-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ee1ccee34c0bed11ef08ba51fbb184af3ee0ffc9663c7c70c2855d595cc09d6 +size 3489662678 diff --git a/pytorch_model-00066-of-00191.bin b/pytorch_model-00066-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..6c98265524dc9db6f30b6034b8fd10c8452f26d4 --- /dev/null +++ b/pytorch_model-00066-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3437c5f71d7dc917efb2ad9c7d7ec2d648f26cc424b26b6c7056e1ec9e7acff7 +size 4630580764 diff --git a/pytorch_model-00068-of-00191.bin b/pytorch_model-00068-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..ccc5e9f381f6d9415e3e17635a5d68b37f4f896e --- /dev/null +++ b/pytorch_model-00068-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88e818d937234b95e3b2fbad48d4ff3837397d7d03fc88972d728827c9292161 +size 3489662678 diff --git a/pytorch_model-00070-of-00191.bin b/pytorch_model-00070-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..d91f53b1b7a5cb874aaf7b7664823d7a9536fe46 --- /dev/null +++ b/pytorch_model-00070-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8d002702f9a36a8775973ac82db70927a74058df0bb3a42c07751df885363cb +size 4630580764 diff --git a/pytorch_model-00071-of-00191.bin b/pytorch_model-00071-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..3012705f8c599b013660ff121e292ef3df5df150 --- /dev/null +++ b/pytorch_model-00071-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af02a37609b3518ebbdc9184df64e28e4eb65d1b31ca541359f11c7bef6eb86d +size 3489662678 diff --git a/pytorch_model-00072-of-00191.bin b/pytorch_model-00072-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..66d87e52d0361501513d39b3b23afc3de1c83196 --- /dev/null +++ b/pytorch_model-00072-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c72571cfc31f24e0cb4c42d53f869223017a9380398f83f61d0d901521acb410 +size 4630580764 diff --git a/pytorch_model-00074-of-00191.bin b/pytorch_model-00074-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..d3cb36a213f3b2ab4133c5639e32824794513d0b --- /dev/null +++ b/pytorch_model-00074-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:832ee060ee9da2b9b58eda8ab0783c5bb401e9196ff0672026f3be514bf18c11 +size 3489662678 diff --git a/pytorch_model-00076-of-00191.bin b/pytorch_model-00076-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..e447afe430ffaf44acd6c97cd3bd08a2dc2133fe --- /dev/null +++ b/pytorch_model-00076-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:575b1345bf48c250d36a5ae1c6fbc8249725417376ff085110a675e748534250 +size 4630580764 diff --git a/pytorch_model-00077-of-00191.bin b/pytorch_model-00077-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..121588e0f8c13d7d7266a0c5b456f470c91da71c --- /dev/null +++ b/pytorch_model-00077-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80eb25e08de1ef893586059a1de4ee4d92732d577c09a8b1e99d847e194078ee +size 3489662678 diff --git a/pytorch_model-00080-of-00191.bin b/pytorch_model-00080-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..6737ef5dffc0aa5404773e15c4922a235170e283 --- /dev/null +++ b/pytorch_model-00080-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd22484ffa9863f64b9c6ca089f801aceff3661a99c0e129c554113be9f8eabf +size 3489662678 diff --git a/pytorch_model-00081-of-00191.bin b/pytorch_model-00081-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..598de458793237e16b1a1d0993463349dfcbd91f --- /dev/null +++ b/pytorch_model-00081-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c530e88966cac407fcbf765e02abcfbf10aab6468c3127e68b5365e4703d1fbc +size 4630580764 diff --git a/pytorch_model-00083-of-00191.bin b/pytorch_model-00083-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..f8d9bd5a97ac3d014fc9ed9ef34a4a4dc4c3cee2 --- /dev/null +++ b/pytorch_model-00083-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d73da7c066904482d591f4c174c079c2b7502985f6484e9213618699f27f5b8c +size 3489662678 diff --git a/pytorch_model-00084-of-00191.bin b/pytorch_model-00084-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..b8f67ebdc217b2c75ea2d6b60313595fee991f42 --- /dev/null +++ b/pytorch_model-00084-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e66753d2f91a93b1482edcb88582d15ad58c389c8e9115308699d83f8469f655 +size 4630580764 diff --git a/pytorch_model-00086-of-00191.bin b/pytorch_model-00086-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..f955fbdafa81fa65e3b3780ba5e86ca1bae7d1d5 --- /dev/null +++ b/pytorch_model-00086-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54c6eb79cf32d161aa07de60f26c0d2edde1c933d5d8c00da84913e3f18ade33 +size 3489662678 diff --git a/pytorch_model-00087-of-00191.bin b/pytorch_model-00087-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..44544ec60e986f92edd85cb3e3aa9ab284ab2a24 --- /dev/null +++ b/pytorch_model-00087-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee46b0b6b6c9688a64b9d1547ce3785114183d18827ce4f5f65d9670c0a74bbd +size 4630580764 diff --git a/pytorch_model-00089-of-00191.bin b/pytorch_model-00089-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..371082a3489d5d6d0062a52730a0281c13a571d7 --- /dev/null +++ b/pytorch_model-00089-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d44d728047671eebd4f51cdf350ff0b9b650f3d2487ab826e49925a81e11146d +size 3489662678 diff --git a/pytorch_model-00090-of-00191.bin b/pytorch_model-00090-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..1a7c8ae8948cb9ad00d6dce6c229ce5006269151 --- /dev/null +++ b/pytorch_model-00090-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce425aeb7b655d4b329c0c898f1c3d5e8511d2dc7d3686a1b89292f986217977 +size 4630580764 diff --git a/pytorch_model-00091-of-00191.bin b/pytorch_model-00091-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..8ef4b9583e10950a80bb5d52e7a4530a309af913 --- /dev/null +++ b/pytorch_model-00091-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d61e1aa1e86ad9de7a365e9854e7abe2ff84c35d0cccdbc5feda767a171793f0 +size 4630580764 diff --git a/pytorch_model-00092-of-00191.bin b/pytorch_model-00092-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..2e82b10cd66b70539fa71768e915506fe5497105 --- /dev/null +++ b/pytorch_model-00092-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:875aaf1e2fde0b4effecf47c7b8abe5aeb8ea1b56c1c98458712c6dfd2ab5a47 +size 3489662678 diff --git a/pytorch_model-00093-of-00191.bin b/pytorch_model-00093-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..5c5874d5c99c65d28ae9be171ed61fdf1cea0956 --- /dev/null +++ b/pytorch_model-00093-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66eb104046b460d49d4f6994e4be76119fa9739f190bec05a8b4a1c9ecd3c95b +size 4630580764 diff --git a/pytorch_model-00095-of-00191.bin b/pytorch_model-00095-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..f135bd60de433a3a043cd0c3282c288d182e90cc --- /dev/null +++ b/pytorch_model-00095-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a6c1eef1d34e3cec44e68ce14817ced8c1b9fe914fcac8a875583c077988638 +size 3489662678 diff --git a/pytorch_model-00096-of-00191.bin b/pytorch_model-00096-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..5c3e7919dbddfb27d0f07845193d4ac8834bea69 --- /dev/null +++ b/pytorch_model-00096-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4918269951d3365d443a3960432368d914b6b70403670a79605cc14cbb3c6de +size 4630580764 diff --git a/pytorch_model-00097-of-00191.bin b/pytorch_model-00097-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..7ffabf88133c0f7eecf074f3721aabd52c114c8c --- /dev/null +++ b/pytorch_model-00097-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49ee6c2bb7444adc71b96176f2d4747f710ff370b84f51f0ea1c387c2c36c88d +size 4630580764 diff --git a/pytorch_model-00098-of-00191.bin b/pytorch_model-00098-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..a23ebc4e485035bcc7f2decdbeeb00f7ee923109 --- /dev/null +++ b/pytorch_model-00098-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:020dda85dd8f53abaf6791b1251c699c475720294bd10c978d3b16b4110a0295 +size 3489662678 diff --git a/pytorch_model-00099-of-00191.bin b/pytorch_model-00099-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..a41ad500b6976381679e4e6f7018394f3d0169ee --- /dev/null +++ b/pytorch_model-00099-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6674e96ef2eb816285ee6060fd9d4b049d0b51ecd1a83743bdd00fbb045ea41a +size 4630580764 diff --git a/pytorch_model-00100-of-00191.bin b/pytorch_model-00100-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..4a3a6aa1d335324669080ab1680334a22c925b00 --- /dev/null +++ b/pytorch_model-00100-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bc4fce7a8930f708e67b04e95e86d9eb30ee81605c372476a0ed0df82c6cb06 +size 4630580764 diff --git a/pytorch_model-00101-of-00191.bin b/pytorch_model-00101-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..3c307bb4b4fa9c5b561404ae7cde9eedb5f50e46 --- /dev/null +++ b/pytorch_model-00101-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f245c32fd2855730c9b95d13eca642667ae3355ffe422f351348a5d4fdcee749 +size 3489662678 diff --git a/pytorch_model-00104-of-00191.bin b/pytorch_model-00104-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..4a83930b13eff76a7a33ef9f3d24a08df9e19330 --- /dev/null +++ b/pytorch_model-00104-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24926290effa6e7bdb93fcdf3a122ea2d70fa64b7f8f04baf98bac0c379ebb12 +size 3489662678 diff --git a/pytorch_model-00105-of-00191.bin b/pytorch_model-00105-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..fed1b12873e10e5b802aa85b1f356d49d72ceabe --- /dev/null +++ b/pytorch_model-00105-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7925473ed65059dd21c1d0ebb371858629440ea2ca27f792a6c875f00ab34213 +size 4630580764 diff --git a/pytorch_model-00106-of-00191.bin b/pytorch_model-00106-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..4e1bf8dc1403329f3e3f2d17276324cc1af83ba7 --- /dev/null +++ b/pytorch_model-00106-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6af2cf8aaa85325e6eab7a190db6578472915114ad13ae9c4db315d59a02b98 +size 4630580764 diff --git a/pytorch_model-00107-of-00191.bin b/pytorch_model-00107-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..11571b507f8d274f6292c4edca562af268f28dd5 --- /dev/null +++ b/pytorch_model-00107-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8287ff62e756a32d662de0eb98f4beb07c60c40297dea969eca1ef972f178be +size 3489662678 diff --git a/pytorch_model-00108-of-00191.bin b/pytorch_model-00108-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..0bbf06ea06c279e0e26121ebef1409f8197de17d --- /dev/null +++ b/pytorch_model-00108-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcc39fbcfdbda8a2f31691eade3162304b26a5bcb265639908aca1b888cbd2ce +size 4630580764 diff --git a/pytorch_model-00109-of-00191.bin b/pytorch_model-00109-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..fac3b25a9c280252f418581ba32c06bf6806fafe --- /dev/null +++ b/pytorch_model-00109-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf11e3b6286dbf270f9d45167d35f3200a837d0625c4f268970b8729860e6630 +size 4630580764 diff --git a/pytorch_model-00111-of-00191.bin b/pytorch_model-00111-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..46505cd10be3ef27eb0009153a22e52d468f50fe --- /dev/null +++ b/pytorch_model-00111-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fad196ecd903c575b7fb697c0e7f1b7eed4e5a70da52a9af9e73f442d6d38aac +size 4630580764 diff --git a/pytorch_model-00112-of-00191.bin b/pytorch_model-00112-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..3194092529024ac36b1630899cb70767039427a0 --- /dev/null +++ b/pytorch_model-00112-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28f19b915b12484d576c5a47e1856a33acbf547f4fb7e4dd8b578e326aef9f25 +size 4630580764 diff --git a/pytorch_model-00113-of-00191.bin b/pytorch_model-00113-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..31efd58febf69bb922463820484d6f807132d683 --- /dev/null +++ b/pytorch_model-00113-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f97ffbac3446a92217fbfbfce1f606f746c7c70570575661fcf565013d9e2a9 +size 3489662678 diff --git a/pytorch_model-00114-of-00191.bin b/pytorch_model-00114-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..5476cfa1721395431a205fb6cf5ed30073756310 --- /dev/null +++ b/pytorch_model-00114-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:414ec146147fec5c3bd3eb1497574e65458e764ebb6070411202759d4893d8f5 +size 4630580764 diff --git a/pytorch_model-00116-of-00191.bin b/pytorch_model-00116-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..351456f8ea59259e588c8f82f20778a04b431450 --- /dev/null +++ b/pytorch_model-00116-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af15bbd12b9539727e7a7908120e29c10caaa434ecaf2384d211ec002960cad3 +size 3489662678 diff --git a/pytorch_model-00119-of-00191.bin b/pytorch_model-00119-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..8946cd18ff721ec730b17763e04bef4ba8374e79 --- /dev/null +++ b/pytorch_model-00119-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33007248f7cd5f70bf88c5b2d1de01ff309e846bfaacfdc292482aca38025cc9 +size 3489662678 diff --git a/pytorch_model-00120-of-00191.bin b/pytorch_model-00120-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..3b1cd2f403e8b82fcb54ee2ceeb44a5ab54392da --- /dev/null +++ b/pytorch_model-00120-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be00c8cd44fbfe182448686c8d91d43391f2418f4ff201593e449f7abf83e85c +size 4630580764 diff --git a/pytorch_model-00122-of-00191.bin b/pytorch_model-00122-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..c1ccc1c725ddc0000d8121b58f222d15eb16076d --- /dev/null +++ b/pytorch_model-00122-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a970c62cd8a5f26ecf929df7633b237a41bddd6ce121ac11f4f61e088a4e2da +size 3489662678 diff --git a/pytorch_model-00124-of-00191.bin b/pytorch_model-00124-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..921ff4037439e517f2ffc5a56ae81cf5bf1677db --- /dev/null +++ b/pytorch_model-00124-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff9d34aefb2dc527f9de43b4a97a0ec6225b70610950181363939d281838eea2 +size 4630580764 diff --git a/pytorch_model-00125-of-00191.bin b/pytorch_model-00125-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..b0376d3cdf25ca5359eb2635440a2596633029aa --- /dev/null +++ b/pytorch_model-00125-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2c067bbce67204375700d2fc3d146a2bbc5d37aef23548d80fe7a343f4795e3 +size 3489662678 diff --git a/pytorch_model-00127-of-00191.bin b/pytorch_model-00127-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..be7b82400d454d032cc05eb5352e29210e237be9 --- /dev/null +++ b/pytorch_model-00127-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6de7083ccb9052a79cfe87f7cbaa04078cf90822752e7a8cd0bbdc30ee98872 +size 4630580764 diff --git a/pytorch_model-00129-of-00191.bin b/pytorch_model-00129-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..bc9373e58ac498e5ca63ac445f28c3ea8ed2c80b --- /dev/null +++ b/pytorch_model-00129-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8098a228ec064184bee56619d693f6010fbf79ca4b3a1dd633ef14d2ea2384d8 +size 4630580764 diff --git a/pytorch_model-00131-of-00191.bin b/pytorch_model-00131-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..6bd3284f399a57766c68d0ce3dc2d32b0daf30e3 --- /dev/null +++ b/pytorch_model-00131-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba60f4e96bfeead066a046821750a96d5a42e9857fd43eb96ba6783dccc83d45 +size 3489662678 diff --git a/pytorch_model-00132-of-00191.bin b/pytorch_model-00132-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..368ad909af6a460edd40300582df1de643ce5b77 --- /dev/null +++ b/pytorch_model-00132-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4e7509981af7e2777c0a809ed640590b75b57b1049897027ec618ae4440fc4a +size 4630580764 diff --git a/pytorch_model-00134-of-00191.bin b/pytorch_model-00134-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..a15fa43e427d71839d1bd73acb95664727e49453 --- /dev/null +++ b/pytorch_model-00134-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ad42efe8e88e1f9ac9c937a87d030dd0d9032b9e124e0870b0938f584e73aff +size 3489662678 diff --git a/pytorch_model-00139-of-00191.bin b/pytorch_model-00139-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..42ff4df1a43746efea1a37998549b8910b772979 --- /dev/null +++ b/pytorch_model-00139-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e14b82f4cf2bae81eedcffb10e9c04ba3ed634db36ef9b1e73825468f3879a2 +size 4630580764 diff --git a/pytorch_model-00140-of-00191.bin b/pytorch_model-00140-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..462382fb9c6f82b9dcca6387ccbf9451f7d41b04 --- /dev/null +++ b/pytorch_model-00140-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:403c3764e4165b8d97fb76cddbf0330b7443134f5079bb8cb283ecbbb182667c +size 3489662678 diff --git a/pytorch_model-00141-of-00191.bin b/pytorch_model-00141-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..88ec5b090dc8ff422c74a63ac6fcbdf0131b24e0 --- /dev/null +++ b/pytorch_model-00141-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab32c285b334da358cae2821c707770dc98433ceb7817ab1ce9bf95c45567ffd +size 4630580764 diff --git a/pytorch_model-00142-of-00191.bin b/pytorch_model-00142-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..a9b5811460857769b7af34243e89e30e6df32967 --- /dev/null +++ b/pytorch_model-00142-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:432f1e5312c0440e2e0794ec0b94a4c133434f828ea1fa72eaa2914b9a62306d +size 4630580764 diff --git a/pytorch_model-00144-of-00191.bin b/pytorch_model-00144-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..aab9597a555f51c1c99b3de10c43d8aa3f22fb62 --- /dev/null +++ b/pytorch_model-00144-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f544a9ebc050f031e4f6e28109b3ea710b2b4e7318b8915c4cb635bb701aec07 +size 4630580764 diff --git a/pytorch_model-00145-of-00191.bin b/pytorch_model-00145-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..048f11fc00ce3f90aa496bbc8880e0c6a26f9419 --- /dev/null +++ b/pytorch_model-00145-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9baa3cc43d62f9d8d11d58a4c72cd353fb336504a8831c00c1ceb0afa7f7c5b9 +size 4630580764 diff --git a/pytorch_model-00146-of-00191.bin b/pytorch_model-00146-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..30098c5ec8d353e87999a3c1ad1b0f5b3fec5316 --- /dev/null +++ b/pytorch_model-00146-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:125d38a07314b88b9d84b0b38d3c1fb61c4acd850d1d378f39d79a554c69a31c +size 3489662678 diff --git a/pytorch_model-00149-of-00191.bin b/pytorch_model-00149-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..43bf5224639c903b87e98504abc12b2f4052085b --- /dev/null +++ b/pytorch_model-00149-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e45eef58e12100c47ee12e9f4756959fab9d88f6129ac8fc49032bfe6b48124 +size 3489662678 diff --git a/pytorch_model-00150-of-00191.bin b/pytorch_model-00150-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..2609e8aee9c8be138f67a49467ffefbfc824bf92 --- /dev/null +++ b/pytorch_model-00150-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b572688a0b5470c28018b8d6a631b5593068f3f8a48aca8aff403c3e14805417 +size 4630580764 diff --git a/pytorch_model-00151-of-00191.bin b/pytorch_model-00151-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..e3ec623b7c02a854154a07d349e88229f16dea13 --- /dev/null +++ b/pytorch_model-00151-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6088ae73808732e5bfee283d606a03cca8e9a770562c20804bec964064e02d88 +size 4630580764 diff --git a/pytorch_model-00152-of-00191.bin b/pytorch_model-00152-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..052040e9ac39dba6bd15fe4bfa090746cefa19eb --- /dev/null +++ b/pytorch_model-00152-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d5d9e1a9c26c29b881090d887f4dd3fd09566a571238d216f8add1fde33c9a3 +size 3489662678 diff --git a/pytorch_model-00153-of-00191.bin b/pytorch_model-00153-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..de9f025ae125e5a57b2fe3e06cff839e782a3e66 --- /dev/null +++ b/pytorch_model-00153-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a9bdbcd5782faeaa02ccf819ea6cafa9f9060df21080ca42715c4084a1962e7 +size 4630580828 diff --git a/pytorch_model-00154-of-00191.bin b/pytorch_model-00154-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..c5c85aa4c4e5da19f3f93e6e85471180a72b2890 --- /dev/null +++ b/pytorch_model-00154-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb58ec031c8f49f8903c1f4e71dd266064546eaa1c3c4d6ad422ed071ce1c260 +size 4630580828 diff --git a/pytorch_model-00156-of-00191.bin b/pytorch_model-00156-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..444eabc8fe2e88216a1a4e482873c939a4b8bfda --- /dev/null +++ b/pytorch_model-00156-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94d89a3d181a0103a93335bbe73dabbef851e71042b00000c67c5f6a6e610a3d +size 4630580828 diff --git a/pytorch_model-00157-of-00191.bin b/pytorch_model-00157-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..451a9f826f959e94235699d97580a3a5f1e701e1 --- /dev/null +++ b/pytorch_model-00157-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:811b95ab8d2873b75c826edb738cd720bc4c1477d00bd3dbaa85cd745902fce9 +size 4630580828 diff --git a/pytorch_model-00158-of-00191.bin b/pytorch_model-00158-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..5f6514d73e84b3cbe5e20958f17800278024ac07 --- /dev/null +++ b/pytorch_model-00158-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c59bfe8891b5651329c07473666d42ab56306520433daa62a3b4e018de35e1b +size 3489662678 diff --git a/pytorch_model-00159-of-00191.bin b/pytorch_model-00159-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..725e2daebd16c94903a988592771dd79734be9e5 --- /dev/null +++ b/pytorch_model-00159-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69ac8f90510a525733d74c75671368b5737421a21beb619f38fe3b9a33d4d81f +size 4630580828 diff --git a/pytorch_model-00160-of-00191.bin b/pytorch_model-00160-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..0e4337cc917d3d39b52da7e06ce7675de1d98e21 --- /dev/null +++ b/pytorch_model-00160-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b77f2fe82c501647799c36101f9a323d5a674b3c49cc9f5c298bef18471d5577 +size 4630580828 diff --git a/pytorch_model-00161-of-00191.bin b/pytorch_model-00161-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..471beaa971c4eb2c31bac2a001ff9030761d2e3c --- /dev/null +++ b/pytorch_model-00161-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3894c57a21a74d0de37fcf0989b5b5489b3bf2c85b6bda5bd191ff3d6350082 +size 3489662678 diff --git a/pytorch_model-00162-of-00191.bin b/pytorch_model-00162-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..fab26500f4e13cbb4d0018abb3de743c82908f16 --- /dev/null +++ b/pytorch_model-00162-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c76ac219cb7dd7b9f059ca6bc3ee4a4ca89f80e3fffc7e124f38c5d44b68c042 +size 4630580828 diff --git a/pytorch_model-00163-of-00191.bin b/pytorch_model-00163-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..b6c043d0ae7c0c2675aad53214e20e78e354e70e --- /dev/null +++ b/pytorch_model-00163-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36e4c2a36ed3dc7051b379c8b4d8076978c31627a40112a65d28b1dc6bd09e12 +size 4630580828 diff --git a/pytorch_model-00164-of-00191.bin b/pytorch_model-00164-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..49e9e6b315f54da1053297213bcd645478a184d3 --- /dev/null +++ b/pytorch_model-00164-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc7a45c15d6f45c0fd41f5a7dbbdc8f6f80be094333d36d940cf056ed7a599e3 +size 3489662678 diff --git a/pytorch_model-00165-of-00191.bin b/pytorch_model-00165-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..f7171aa057e1550e0ad856afd93f379580cbd2bd --- /dev/null +++ b/pytorch_model-00165-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d7d4aace3b5d7f227b082bdcae29913e5866fcbcee4e67aa03d72d4b8c4dd37 +size 4630580828 diff --git a/pytorch_model-00167-of-00191.bin b/pytorch_model-00167-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..ab0771eacece523b405962ee9f587d72b1197ee2 --- /dev/null +++ b/pytorch_model-00167-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de2734346b56857cbbbae5857ba8262463b46ad3f35ac6d3afd7a97a92310e54 +size 3489662678 diff --git a/pytorch_model-00168-of-00191.bin b/pytorch_model-00168-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..0b561d3acab1686baea913dc74fd4dbc516cf947 --- /dev/null +++ b/pytorch_model-00168-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a6bbbacef462d2e105a8ed58cc66c3da060e43131eb95f898f3e6c12b10a963 +size 4630580828 diff --git a/pytorch_model-00169-of-00191.bin b/pytorch_model-00169-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..f90683c7d00d2e996eab0698af245056eb2b1c4a --- /dev/null +++ b/pytorch_model-00169-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e67b45aefd91474b4d36f992a488431a0f3c6a0f609955ea80f6e91885b1d87 +size 4630580828 diff --git a/pytorch_model-00170-of-00191.bin b/pytorch_model-00170-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..aa2b29d3a12e575135fdd8dfcc679b0fe9537a29 --- /dev/null +++ b/pytorch_model-00170-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55872e54e14e6cbcd6f9bcfe1bda51d3ea51d74909ccb90f31c87d47a562714c +size 3489662678 diff --git a/pytorch_model-00172-of-00191.bin b/pytorch_model-00172-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..649d55c2ee0d5b9d937e43d50d466df9050e0a8b --- /dev/null +++ b/pytorch_model-00172-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5a9421866dd50ca63b3addd247ebbeb3b66c4595176a601c14e8f93076b595b +size 4630580828 diff --git a/pytorch_model-00173-of-00191.bin b/pytorch_model-00173-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..6fca575d1e0930e7cf2f90d65c9a962a4f6e5025 --- /dev/null +++ b/pytorch_model-00173-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c569403e0ea5a25b30a9121c5de473b95e50821c2d08939dbfaf3d2e503be8e4 +size 3489662678 diff --git a/pytorch_model-00174-of-00191.bin b/pytorch_model-00174-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..eda27eac93a7f102a821d78108cc051a17f36d64 --- /dev/null +++ b/pytorch_model-00174-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd3cb397b74380238e32c213700a53cd941fbdfaf41b696534fae733ac0821e1 +size 4630580828 diff --git a/pytorch_model-00175-of-00191.bin b/pytorch_model-00175-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..b7d194c55b862f583c4b33c022e95515f5314ca2 --- /dev/null +++ b/pytorch_model-00175-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de04764e58b44c4330d7922817768c1a3d1908057f1709dc0e0c6c522ebd181b +size 4630580828 diff --git a/pytorch_model-00176-of-00191.bin b/pytorch_model-00176-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..c6201fe85082326813edf8bb55ebbbfb42cf056d --- /dev/null +++ b/pytorch_model-00176-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c551d3a4d11be7c4d9758f2cf55929264f8356d7e030783ad91ce7a1bff9e81 +size 3489662678 diff --git a/pytorch_model-00177-of-00191.bin b/pytorch_model-00177-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..9911d47a3fd4dbf685d4062bbc4f9639c81fe6bc --- /dev/null +++ b/pytorch_model-00177-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3a23fb5425ad69feaf8df2b40b14ae9becbc6df373e353abd6a08538500f4f6 +size 4630580828 diff --git a/pytorch_model-00178-of-00191.bin b/pytorch_model-00178-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..b1adfd86ff7d440dd112393e0717360d642c9c67 --- /dev/null +++ b/pytorch_model-00178-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8dcef4e99586090bcdae8eaa3733f5c8b0820efc988b61d6e66f5a10318fa300 +size 4630580828 diff --git a/pytorch_model-00179-of-00191.bin b/pytorch_model-00179-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..b7008bd09e4f81fb8d89870002884295cb75f7af --- /dev/null +++ b/pytorch_model-00179-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bfa1a8a2380a53cff7ce71087d942a7fb4f115eb7ec8db280c083e0c09fd27c +size 3489662678 diff --git a/pytorch_model-00181-of-00191.bin b/pytorch_model-00181-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..1be3f4e630f92bb71a94caf88ee5188135bb5acc --- /dev/null +++ b/pytorch_model-00181-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:033564aecb61a1aa3946ac256ff6b413724e3f95bcad763f82d575ddf25ea8e6 +size 4630580828 diff --git a/pytorch_model-00182-of-00191.bin b/pytorch_model-00182-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..e708ebf52291ee7766fea5c3bf6db602c2c6c9dd --- /dev/null +++ b/pytorch_model-00182-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f813c4b32fa402a70f7ea5dd3feba525ab497c8dd16c21fc3c680a790ff6f85f +size 3489662678 diff --git a/pytorch_model-00183-of-00191.bin b/pytorch_model-00183-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..1e5f218fec6c5d6e13946b1410f817cd93174b1e --- /dev/null +++ b/pytorch_model-00183-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:386973e9ed16a7c3668d9267e1ff38fc187771480057e339a2b4f7c50fa1bd66 +size 4630580828 diff --git a/pytorch_model-00184-of-00191.bin b/pytorch_model-00184-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..4403be2732a382969b9db05376540c5e36a6e949 --- /dev/null +++ b/pytorch_model-00184-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fb088c5c295f9221a908ed30461efbb1a57e75683ed7ac68eaaae8c26c86b8c +size 4630580828 diff --git a/pytorch_model-00185-of-00191.bin b/pytorch_model-00185-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..40cbeea88bebdf2242d84350f38d826fe344ee34 --- /dev/null +++ b/pytorch_model-00185-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9dfb146823d2724f1cc360305f98dc2d7e1eb3c0167f221c99df103e66331574 +size 3489662678 diff --git a/pytorch_model-00186-of-00191.bin b/pytorch_model-00186-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..6ebb420fe29b36f194ded7b47519ebec7e0fb253 --- /dev/null +++ b/pytorch_model-00186-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1fc64389869c4e7227fd6e4f9c6e5f4f4810d35713c402a3dbbf895140254d2 +size 4630580828 diff --git a/pytorch_model-00187-of-00191.bin b/pytorch_model-00187-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..b1fd4e175611c99cbc3f58ab9627f5bfea3be223 --- /dev/null +++ b/pytorch_model-00187-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4568906b2399dd0a5e19a70aab9f4092a210e8bd579a1061a3d2e624a8cb2081 +size 4630580828 diff --git a/pytorch_model-00190-of-00191.bin b/pytorch_model-00190-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..1c799bf3cab1b8cf8f560fb18a42fa9c15c9d3ac --- /dev/null +++ b/pytorch_model-00190-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e85d4f60a8d0a0b5d9003d62af2d2f62decc8911f062b4ad94a20ee3f6d7dc4f +size 3489761865 diff --git a/pytorch_model-00191-of-00191.bin b/pytorch_model-00191-of-00191.bin new file mode 100644 index 0000000000000000000000000000000000000000..3018f177b9c21086f0d1a3687a3aa01e572adf4e --- /dev/null +++ b/pytorch_model-00191-of-00191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02a11b2417d6ae9a9acf0ffd510a8fd9e9c488c383c93852217d59e4648475d5 +size 4202956165 diff --git a/pytorch_model.bin.index.json b/pytorch_model.bin.index.json new file mode 100644 index 0000000000000000000000000000000000000000..47972247867e3089195ae718798efd5534931a11 --- /dev/null +++ b/pytorch_model.bin.index.json @@ -0,0 +1,1144 @@ +{ + "metadata": { + "total_size": 811707301888 + }, + "weight_map": { + "lm_head.weight": "pytorch_model-00191-of-00191.bin", + "model.embed_tokens.weight": "pytorch_model-00001-of-00191.bin", + "model.layers.0.input_layernorm.weight": "pytorch_model-00003-of-00191.bin", + "model.layers.0.mlp.down_proj.weight": "pytorch_model-00003-of-00191.bin", + "model.layers.0.mlp.gate_proj.weight": "pytorch_model-00002-of-00191.bin", + "model.layers.0.mlp.up_proj.weight": "pytorch_model-00002-of-00191.bin", + "model.layers.0.post_attention_layernorm.weight": "pytorch_model-00003-of-00191.bin", + "model.layers.0.self_attn.k_proj.weight": "pytorch_model-00001-of-00191.bin", + "model.layers.0.self_attn.o_proj.weight": "pytorch_model-00002-of-00191.bin", + "model.layers.0.self_attn.q_proj.weight": "pytorch_model-00001-of-00191.bin", + "model.layers.0.self_attn.v_proj.weight": "pytorch_model-00001-of-00191.bin", + "model.layers.1.input_layernorm.weight": "pytorch_model-00004-of-00191.bin", + "model.layers.1.mlp.down_proj.weight": "pytorch_model-00004-of-00191.bin", + "model.layers.1.mlp.gate_proj.weight": "pytorch_model-00003-of-00191.bin", + "model.layers.1.mlp.up_proj.weight": "pytorch_model-00004-of-00191.bin", + "model.layers.1.post_attention_layernorm.weight": "pytorch_model-00004-of-00191.bin", + "model.layers.1.self_attn.k_proj.weight": "pytorch_model-00003-of-00191.bin", + "model.layers.1.self_attn.o_proj.weight": "pytorch_model-00003-of-00191.bin", + "model.layers.1.self_attn.q_proj.weight": "pytorch_model-00003-of-00191.bin", + "model.layers.1.self_attn.v_proj.weight": "pytorch_model-00003-of-00191.bin", + "model.layers.10.input_layernorm.weight": "pytorch_model-00018-of-00191.bin", + "model.layers.10.mlp.down_proj.weight": "pytorch_model-00018-of-00191.bin", + "model.layers.10.mlp.gate_proj.weight": "pytorch_model-00017-of-00191.bin", + "model.layers.10.mlp.up_proj.weight": "pytorch_model-00017-of-00191.bin", + "model.layers.10.post_attention_layernorm.weight": "pytorch_model-00018-of-00191.bin", + "model.layers.10.self_attn.k_proj.weight": "pytorch_model-00016-of-00191.bin", + "model.layers.10.self_attn.o_proj.weight": "pytorch_model-00016-of-00191.bin", + "model.layers.10.self_attn.q_proj.weight": "pytorch_model-00016-of-00191.bin", + "model.layers.10.self_attn.v_proj.weight": "pytorch_model-00016-of-00191.bin", + "model.layers.100.input_layernorm.weight": "pytorch_model-00153-of-00191.bin", + "model.layers.100.mlp.down_proj.weight": "pytorch_model-00153-of-00191.bin", + "model.layers.100.mlp.gate_proj.weight": "pytorch_model-00152-of-00191.bin", + "model.layers.100.mlp.up_proj.weight": "pytorch_model-00152-of-00191.bin", + "model.layers.100.post_attention_layernorm.weight": "pytorch_model-00153-of-00191.bin", + "model.layers.100.self_attn.k_proj.weight": "pytorch_model-00151-of-00191.bin", + "model.layers.100.self_attn.o_proj.weight": "pytorch_model-00151-of-00191.bin", + "model.layers.100.self_attn.q_proj.weight": "pytorch_model-00151-of-00191.bin", + "model.layers.100.self_attn.v_proj.weight": "pytorch_model-00151-of-00191.bin", + "model.layers.101.input_layernorm.weight": "pytorch_model-00154-of-00191.bin", + "model.layers.101.mlp.down_proj.weight": "pytorch_model-00154-of-00191.bin", + "model.layers.101.mlp.gate_proj.weight": "pytorch_model-00153-of-00191.bin", + "model.layers.101.mlp.up_proj.weight": "pytorch_model-00154-of-00191.bin", + "model.layers.101.post_attention_layernorm.weight": "pytorch_model-00154-of-00191.bin", + "model.layers.101.self_attn.k_proj.weight": "pytorch_model-00153-of-00191.bin", + "model.layers.101.self_attn.o_proj.weight": "pytorch_model-00153-of-00191.bin", + "model.layers.101.self_attn.q_proj.weight": "pytorch_model-00153-of-00191.bin", + "model.layers.101.self_attn.v_proj.weight": "pytorch_model-00153-of-00191.bin", + "model.layers.102.input_layernorm.weight": "pytorch_model-00156-of-00191.bin", + "model.layers.102.mlp.down_proj.weight": "pytorch_model-00156-of-00191.bin", + "model.layers.102.mlp.gate_proj.weight": "pytorch_model-00155-of-00191.bin", + "model.layers.102.mlp.up_proj.weight": "pytorch_model-00155-of-00191.bin", + "model.layers.102.post_attention_layernorm.weight": "pytorch_model-00156-of-00191.bin", + "model.layers.102.self_attn.k_proj.weight": "pytorch_model-00154-of-00191.bin", + "model.layers.102.self_attn.o_proj.weight": "pytorch_model-00154-of-00191.bin", + "model.layers.102.self_attn.q_proj.weight": "pytorch_model-00154-of-00191.bin", + "model.layers.102.self_attn.v_proj.weight": "pytorch_model-00154-of-00191.bin", + "model.layers.103.input_layernorm.weight": "pytorch_model-00157-of-00191.bin", + "model.layers.103.mlp.down_proj.weight": "pytorch_model-00157-of-00191.bin", + "model.layers.103.mlp.gate_proj.weight": "pytorch_model-00156-of-00191.bin", + "model.layers.103.mlp.up_proj.weight": "pytorch_model-00157-of-00191.bin", + "model.layers.103.post_attention_layernorm.weight": "pytorch_model-00157-of-00191.bin", + "model.layers.103.self_attn.k_proj.weight": "pytorch_model-00156-of-00191.bin", + "model.layers.103.self_attn.o_proj.weight": "pytorch_model-00156-of-00191.bin", + "model.layers.103.self_attn.q_proj.weight": "pytorch_model-00156-of-00191.bin", + "model.layers.103.self_attn.v_proj.weight": "pytorch_model-00156-of-00191.bin", + "model.layers.104.input_layernorm.weight": "pytorch_model-00159-of-00191.bin", + "model.layers.104.mlp.down_proj.weight": "pytorch_model-00159-of-00191.bin", + "model.layers.104.mlp.gate_proj.weight": "pytorch_model-00158-of-00191.bin", + "model.layers.104.mlp.up_proj.weight": "pytorch_model-00158-of-00191.bin", + "model.layers.104.post_attention_layernorm.weight": "pytorch_model-00159-of-00191.bin", + "model.layers.104.self_attn.k_proj.weight": "pytorch_model-00157-of-00191.bin", + "model.layers.104.self_attn.o_proj.weight": "pytorch_model-00157-of-00191.bin", + "model.layers.104.self_attn.q_proj.weight": "pytorch_model-00157-of-00191.bin", + "model.layers.104.self_attn.v_proj.weight": "pytorch_model-00157-of-00191.bin", + "model.layers.105.input_layernorm.weight": "pytorch_model-00160-of-00191.bin", + "model.layers.105.mlp.down_proj.weight": "pytorch_model-00160-of-00191.bin", + "model.layers.105.mlp.gate_proj.weight": "pytorch_model-00159-of-00191.bin", + "model.layers.105.mlp.up_proj.weight": "pytorch_model-00160-of-00191.bin", + "model.layers.105.post_attention_layernorm.weight": "pytorch_model-00160-of-00191.bin", + "model.layers.105.self_attn.k_proj.weight": "pytorch_model-00159-of-00191.bin", + "model.layers.105.self_attn.o_proj.weight": "pytorch_model-00159-of-00191.bin", + "model.layers.105.self_attn.q_proj.weight": "pytorch_model-00159-of-00191.bin", + "model.layers.105.self_attn.v_proj.weight": "pytorch_model-00159-of-00191.bin", + "model.layers.106.input_layernorm.weight": "pytorch_model-00162-of-00191.bin", + "model.layers.106.mlp.down_proj.weight": "pytorch_model-00162-of-00191.bin", + "model.layers.106.mlp.gate_proj.weight": "pytorch_model-00161-of-00191.bin", + "model.layers.106.mlp.up_proj.weight": "pytorch_model-00161-of-00191.bin", + "model.layers.106.post_attention_layernorm.weight": "pytorch_model-00162-of-00191.bin", + "model.layers.106.self_attn.k_proj.weight": "pytorch_model-00160-of-00191.bin", + "model.layers.106.self_attn.o_proj.weight": "pytorch_model-00160-of-00191.bin", + "model.layers.106.self_attn.q_proj.weight": "pytorch_model-00160-of-00191.bin", + "model.layers.106.self_attn.v_proj.weight": "pytorch_model-00160-of-00191.bin", + "model.layers.107.input_layernorm.weight": "pytorch_model-00163-of-00191.bin", + "model.layers.107.mlp.down_proj.weight": "pytorch_model-00163-of-00191.bin", + "model.layers.107.mlp.gate_proj.weight": "pytorch_model-00162-of-00191.bin", + "model.layers.107.mlp.up_proj.weight": "pytorch_model-00163-of-00191.bin", + "model.layers.107.post_attention_layernorm.weight": "pytorch_model-00163-of-00191.bin", + "model.layers.107.self_attn.k_proj.weight": "pytorch_model-00162-of-00191.bin", + "model.layers.107.self_attn.o_proj.weight": "pytorch_model-00162-of-00191.bin", + "model.layers.107.self_attn.q_proj.weight": "pytorch_model-00162-of-00191.bin", + "model.layers.107.self_attn.v_proj.weight": "pytorch_model-00162-of-00191.bin", + "model.layers.108.input_layernorm.weight": "pytorch_model-00165-of-00191.bin", + "model.layers.108.mlp.down_proj.weight": "pytorch_model-00165-of-00191.bin", + "model.layers.108.mlp.gate_proj.weight": "pytorch_model-00164-of-00191.bin", + "model.layers.108.mlp.up_proj.weight": "pytorch_model-00164-of-00191.bin", + "model.layers.108.post_attention_layernorm.weight": "pytorch_model-00165-of-00191.bin", + "model.layers.108.self_attn.k_proj.weight": "pytorch_model-00163-of-00191.bin", + "model.layers.108.self_attn.o_proj.weight": "pytorch_model-00163-of-00191.bin", + "model.layers.108.self_attn.q_proj.weight": "pytorch_model-00163-of-00191.bin", + "model.layers.108.self_attn.v_proj.weight": "pytorch_model-00163-of-00191.bin", + "model.layers.109.input_layernorm.weight": "pytorch_model-00166-of-00191.bin", + "model.layers.109.mlp.down_proj.weight": "pytorch_model-00166-of-00191.bin", + "model.layers.109.mlp.gate_proj.weight": "pytorch_model-00165-of-00191.bin", + "model.layers.109.mlp.up_proj.weight": "pytorch_model-00166-of-00191.bin", + "model.layers.109.post_attention_layernorm.weight": "pytorch_model-00166-of-00191.bin", + "model.layers.109.self_attn.k_proj.weight": "pytorch_model-00165-of-00191.bin", + "model.layers.109.self_attn.o_proj.weight": "pytorch_model-00165-of-00191.bin", + "model.layers.109.self_attn.q_proj.weight": "pytorch_model-00165-of-00191.bin", + "model.layers.109.self_attn.v_proj.weight": "pytorch_model-00165-of-00191.bin", + "model.layers.11.input_layernorm.weight": "pytorch_model-00019-of-00191.bin", + "model.layers.11.mlp.down_proj.weight": "pytorch_model-00019-of-00191.bin", + "model.layers.11.mlp.gate_proj.weight": "pytorch_model-00018-of-00191.bin", + "model.layers.11.mlp.up_proj.weight": "pytorch_model-00019-of-00191.bin", + "model.layers.11.post_attention_layernorm.weight": "pytorch_model-00019-of-00191.bin", + "model.layers.11.self_attn.k_proj.weight": "pytorch_model-00018-of-00191.bin", + "model.layers.11.self_attn.o_proj.weight": "pytorch_model-00018-of-00191.bin", + "model.layers.11.self_attn.q_proj.weight": "pytorch_model-00018-of-00191.bin", + "model.layers.11.self_attn.v_proj.weight": "pytorch_model-00018-of-00191.bin", + "model.layers.110.input_layernorm.weight": "pytorch_model-00168-of-00191.bin", + "model.layers.110.mlp.down_proj.weight": "pytorch_model-00168-of-00191.bin", + "model.layers.110.mlp.gate_proj.weight": "pytorch_model-00167-of-00191.bin", + "model.layers.110.mlp.up_proj.weight": "pytorch_model-00167-of-00191.bin", + "model.layers.110.post_attention_layernorm.weight": "pytorch_model-00168-of-00191.bin", + "model.layers.110.self_attn.k_proj.weight": "pytorch_model-00166-of-00191.bin", + "model.layers.110.self_attn.o_proj.weight": "pytorch_model-00166-of-00191.bin", + "model.layers.110.self_attn.q_proj.weight": "pytorch_model-00166-of-00191.bin", + "model.layers.110.self_attn.v_proj.weight": "pytorch_model-00166-of-00191.bin", + "model.layers.111.input_layernorm.weight": "pytorch_model-00169-of-00191.bin", + "model.layers.111.mlp.down_proj.weight": "pytorch_model-00169-of-00191.bin", + "model.layers.111.mlp.gate_proj.weight": "pytorch_model-00168-of-00191.bin", + "model.layers.111.mlp.up_proj.weight": "pytorch_model-00169-of-00191.bin", + "model.layers.111.post_attention_layernorm.weight": "pytorch_model-00169-of-00191.bin", + "model.layers.111.self_attn.k_proj.weight": "pytorch_model-00168-of-00191.bin", + "model.layers.111.self_attn.o_proj.weight": "pytorch_model-00168-of-00191.bin", + "model.layers.111.self_attn.q_proj.weight": "pytorch_model-00168-of-00191.bin", + "model.layers.111.self_attn.v_proj.weight": "pytorch_model-00168-of-00191.bin", + "model.layers.112.input_layernorm.weight": "pytorch_model-00171-of-00191.bin", + "model.layers.112.mlp.down_proj.weight": "pytorch_model-00171-of-00191.bin", + "model.layers.112.mlp.gate_proj.weight": "pytorch_model-00170-of-00191.bin", + "model.layers.112.mlp.up_proj.weight": "pytorch_model-00170-of-00191.bin", + "model.layers.112.post_attention_layernorm.weight": "pytorch_model-00171-of-00191.bin", + "model.layers.112.self_attn.k_proj.weight": "pytorch_model-00169-of-00191.bin", + "model.layers.112.self_attn.o_proj.weight": "pytorch_model-00169-of-00191.bin", + "model.layers.112.self_attn.q_proj.weight": "pytorch_model-00169-of-00191.bin", + "model.layers.112.self_attn.v_proj.weight": "pytorch_model-00169-of-00191.bin", + "model.layers.113.input_layernorm.weight": "pytorch_model-00172-of-00191.bin", + "model.layers.113.mlp.down_proj.weight": "pytorch_model-00172-of-00191.bin", + "model.layers.113.mlp.gate_proj.weight": "pytorch_model-00171-of-00191.bin", + "model.layers.113.mlp.up_proj.weight": "pytorch_model-00172-of-00191.bin", + "model.layers.113.post_attention_layernorm.weight": "pytorch_model-00172-of-00191.bin", + "model.layers.113.self_attn.k_proj.weight": "pytorch_model-00171-of-00191.bin", + "model.layers.113.self_attn.o_proj.weight": "pytorch_model-00171-of-00191.bin", + "model.layers.113.self_attn.q_proj.weight": "pytorch_model-00171-of-00191.bin", + "model.layers.113.self_attn.v_proj.weight": "pytorch_model-00171-of-00191.bin", + "model.layers.114.input_layernorm.weight": "pytorch_model-00174-of-00191.bin", + "model.layers.114.mlp.down_proj.weight": "pytorch_model-00174-of-00191.bin", + "model.layers.114.mlp.gate_proj.weight": "pytorch_model-00173-of-00191.bin", + "model.layers.114.mlp.up_proj.weight": "pytorch_model-00173-of-00191.bin", + "model.layers.114.post_attention_layernorm.weight": "pytorch_model-00174-of-00191.bin", + "model.layers.114.self_attn.k_proj.weight": "pytorch_model-00172-of-00191.bin", + "model.layers.114.self_attn.o_proj.weight": "pytorch_model-00172-of-00191.bin", + "model.layers.114.self_attn.q_proj.weight": "pytorch_model-00172-of-00191.bin", + "model.layers.114.self_attn.v_proj.weight": "pytorch_model-00172-of-00191.bin", + "model.layers.115.input_layernorm.weight": "pytorch_model-00175-of-00191.bin", + "model.layers.115.mlp.down_proj.weight": "pytorch_model-00175-of-00191.bin", + "model.layers.115.mlp.gate_proj.weight": "pytorch_model-00174-of-00191.bin", + "model.layers.115.mlp.up_proj.weight": "pytorch_model-00175-of-00191.bin", + "model.layers.115.post_attention_layernorm.weight": "pytorch_model-00175-of-00191.bin", + "model.layers.115.self_attn.k_proj.weight": "pytorch_model-00174-of-00191.bin", + "model.layers.115.self_attn.o_proj.weight": "pytorch_model-00174-of-00191.bin", + "model.layers.115.self_attn.q_proj.weight": "pytorch_model-00174-of-00191.bin", + "model.layers.115.self_attn.v_proj.weight": "pytorch_model-00174-of-00191.bin", + "model.layers.116.input_layernorm.weight": "pytorch_model-00177-of-00191.bin", + "model.layers.116.mlp.down_proj.weight": "pytorch_model-00177-of-00191.bin", + "model.layers.116.mlp.gate_proj.weight": "pytorch_model-00176-of-00191.bin", + "model.layers.116.mlp.up_proj.weight": "pytorch_model-00176-of-00191.bin", + "model.layers.116.post_attention_layernorm.weight": "pytorch_model-00177-of-00191.bin", + "model.layers.116.self_attn.k_proj.weight": "pytorch_model-00175-of-00191.bin", + "model.layers.116.self_attn.o_proj.weight": "pytorch_model-00175-of-00191.bin", + "model.layers.116.self_attn.q_proj.weight": "pytorch_model-00175-of-00191.bin", + "model.layers.116.self_attn.v_proj.weight": "pytorch_model-00175-of-00191.bin", + "model.layers.117.input_layernorm.weight": "pytorch_model-00178-of-00191.bin", + "model.layers.117.mlp.down_proj.weight": "pytorch_model-00178-of-00191.bin", + "model.layers.117.mlp.gate_proj.weight": "pytorch_model-00177-of-00191.bin", + "model.layers.117.mlp.up_proj.weight": "pytorch_model-00178-of-00191.bin", + "model.layers.117.post_attention_layernorm.weight": "pytorch_model-00178-of-00191.bin", + "model.layers.117.self_attn.k_proj.weight": "pytorch_model-00177-of-00191.bin", + "model.layers.117.self_attn.o_proj.weight": "pytorch_model-00177-of-00191.bin", + "model.layers.117.self_attn.q_proj.weight": "pytorch_model-00177-of-00191.bin", + "model.layers.117.self_attn.v_proj.weight": "pytorch_model-00177-of-00191.bin", + "model.layers.118.input_layernorm.weight": "pytorch_model-00180-of-00191.bin", + "model.layers.118.mlp.down_proj.weight": "pytorch_model-00180-of-00191.bin", + "model.layers.118.mlp.gate_proj.weight": "pytorch_model-00179-of-00191.bin", + "model.layers.118.mlp.up_proj.weight": "pytorch_model-00179-of-00191.bin", + "model.layers.118.post_attention_layernorm.weight": "pytorch_model-00180-of-00191.bin", + "model.layers.118.self_attn.k_proj.weight": "pytorch_model-00178-of-00191.bin", + "model.layers.118.self_attn.o_proj.weight": "pytorch_model-00178-of-00191.bin", + "model.layers.118.self_attn.q_proj.weight": "pytorch_model-00178-of-00191.bin", + "model.layers.118.self_attn.v_proj.weight": "pytorch_model-00178-of-00191.bin", + "model.layers.119.input_layernorm.weight": "pytorch_model-00181-of-00191.bin", + "model.layers.119.mlp.down_proj.weight": "pytorch_model-00181-of-00191.bin", + "model.layers.119.mlp.gate_proj.weight": "pytorch_model-00180-of-00191.bin", + "model.layers.119.mlp.up_proj.weight": "pytorch_model-00181-of-00191.bin", + "model.layers.119.post_attention_layernorm.weight": "pytorch_model-00181-of-00191.bin", + "model.layers.119.self_attn.k_proj.weight": "pytorch_model-00180-of-00191.bin", + "model.layers.119.self_attn.o_proj.weight": "pytorch_model-00180-of-00191.bin", + "model.layers.119.self_attn.q_proj.weight": "pytorch_model-00180-of-00191.bin", + "model.layers.119.self_attn.v_proj.weight": "pytorch_model-00180-of-00191.bin", + "model.layers.12.input_layernorm.weight": "pytorch_model-00021-of-00191.bin", + "model.layers.12.mlp.down_proj.weight": "pytorch_model-00021-of-00191.bin", + "model.layers.12.mlp.gate_proj.weight": "pytorch_model-00020-of-00191.bin", + "model.layers.12.mlp.up_proj.weight": "pytorch_model-00020-of-00191.bin", + "model.layers.12.post_attention_layernorm.weight": "pytorch_model-00021-of-00191.bin", + "model.layers.12.self_attn.k_proj.weight": "pytorch_model-00019-of-00191.bin", + "model.layers.12.self_attn.o_proj.weight": "pytorch_model-00019-of-00191.bin", + "model.layers.12.self_attn.q_proj.weight": "pytorch_model-00019-of-00191.bin", + "model.layers.12.self_attn.v_proj.weight": "pytorch_model-00019-of-00191.bin", + "model.layers.120.input_layernorm.weight": "pytorch_model-00183-of-00191.bin", + "model.layers.120.mlp.down_proj.weight": "pytorch_model-00183-of-00191.bin", + "model.layers.120.mlp.gate_proj.weight": "pytorch_model-00182-of-00191.bin", + "model.layers.120.mlp.up_proj.weight": "pytorch_model-00182-of-00191.bin", + "model.layers.120.post_attention_layernorm.weight": "pytorch_model-00183-of-00191.bin", + "model.layers.120.self_attn.k_proj.weight": "pytorch_model-00181-of-00191.bin", + "model.layers.120.self_attn.o_proj.weight": "pytorch_model-00181-of-00191.bin", + "model.layers.120.self_attn.q_proj.weight": "pytorch_model-00181-of-00191.bin", + "model.layers.120.self_attn.v_proj.weight": "pytorch_model-00181-of-00191.bin", + "model.layers.121.input_layernorm.weight": "pytorch_model-00184-of-00191.bin", + "model.layers.121.mlp.down_proj.weight": "pytorch_model-00184-of-00191.bin", + "model.layers.121.mlp.gate_proj.weight": "pytorch_model-00183-of-00191.bin", + "model.layers.121.mlp.up_proj.weight": "pytorch_model-00184-of-00191.bin", + "model.layers.121.post_attention_layernorm.weight": "pytorch_model-00184-of-00191.bin", + "model.layers.121.self_attn.k_proj.weight": "pytorch_model-00183-of-00191.bin", + "model.layers.121.self_attn.o_proj.weight": "pytorch_model-00183-of-00191.bin", + "model.layers.121.self_attn.q_proj.weight": "pytorch_model-00183-of-00191.bin", + "model.layers.121.self_attn.v_proj.weight": "pytorch_model-00183-of-00191.bin", + "model.layers.122.input_layernorm.weight": "pytorch_model-00186-of-00191.bin", + "model.layers.122.mlp.down_proj.weight": "pytorch_model-00186-of-00191.bin", + "model.layers.122.mlp.gate_proj.weight": "pytorch_model-00185-of-00191.bin", + "model.layers.122.mlp.up_proj.weight": "pytorch_model-00185-of-00191.bin", + "model.layers.122.post_attention_layernorm.weight": "pytorch_model-00186-of-00191.bin", + "model.layers.122.self_attn.k_proj.weight": "pytorch_model-00184-of-00191.bin", + "model.layers.122.self_attn.o_proj.weight": "pytorch_model-00184-of-00191.bin", + "model.layers.122.self_attn.q_proj.weight": "pytorch_model-00184-of-00191.bin", + "model.layers.122.self_attn.v_proj.weight": "pytorch_model-00184-of-00191.bin", + "model.layers.123.input_layernorm.weight": "pytorch_model-00187-of-00191.bin", + "model.layers.123.mlp.down_proj.weight": "pytorch_model-00187-of-00191.bin", + "model.layers.123.mlp.gate_proj.weight": "pytorch_model-00186-of-00191.bin", + "model.layers.123.mlp.up_proj.weight": "pytorch_model-00187-of-00191.bin", + "model.layers.123.post_attention_layernorm.weight": "pytorch_model-00187-of-00191.bin", + "model.layers.123.self_attn.k_proj.weight": "pytorch_model-00186-of-00191.bin", + "model.layers.123.self_attn.o_proj.weight": "pytorch_model-00186-of-00191.bin", + "model.layers.123.self_attn.q_proj.weight": "pytorch_model-00186-of-00191.bin", + "model.layers.123.self_attn.v_proj.weight": "pytorch_model-00186-of-00191.bin", + "model.layers.124.input_layernorm.weight": "pytorch_model-00189-of-00191.bin", + "model.layers.124.mlp.down_proj.weight": "pytorch_model-00189-of-00191.bin", + "model.layers.124.mlp.gate_proj.weight": "pytorch_model-00188-of-00191.bin", + "model.layers.124.mlp.up_proj.weight": "pytorch_model-00188-of-00191.bin", + "model.layers.124.post_attention_layernorm.weight": "pytorch_model-00189-of-00191.bin", + "model.layers.124.self_attn.k_proj.weight": "pytorch_model-00187-of-00191.bin", + "model.layers.124.self_attn.o_proj.weight": "pytorch_model-00187-of-00191.bin", + "model.layers.124.self_attn.q_proj.weight": "pytorch_model-00187-of-00191.bin", + "model.layers.124.self_attn.v_proj.weight": "pytorch_model-00187-of-00191.bin", + "model.layers.125.input_layernorm.weight": "pytorch_model-00190-of-00191.bin", + "model.layers.125.mlp.down_proj.weight": "pytorch_model-00190-of-00191.bin", + "model.layers.125.mlp.gate_proj.weight": "pytorch_model-00189-of-00191.bin", + "model.layers.125.mlp.up_proj.weight": "pytorch_model-00190-of-00191.bin", + "model.layers.125.post_attention_layernorm.weight": "pytorch_model-00190-of-00191.bin", + "model.layers.125.self_attn.k_proj.weight": "pytorch_model-00189-of-00191.bin", + "model.layers.125.self_attn.o_proj.weight": "pytorch_model-00189-of-00191.bin", + "model.layers.125.self_attn.q_proj.weight": "pytorch_model-00189-of-00191.bin", + "model.layers.125.self_attn.v_proj.weight": "pytorch_model-00189-of-00191.bin", + "model.layers.13.input_layernorm.weight": "pytorch_model-00022-of-00191.bin", + "model.layers.13.mlp.down_proj.weight": "pytorch_model-00022-of-00191.bin", + "model.layers.13.mlp.gate_proj.weight": "pytorch_model-00021-of-00191.bin", + "model.layers.13.mlp.up_proj.weight": "pytorch_model-00022-of-00191.bin", + "model.layers.13.post_attention_layernorm.weight": "pytorch_model-00022-of-00191.bin", + "model.layers.13.self_attn.k_proj.weight": "pytorch_model-00021-of-00191.bin", + "model.layers.13.self_attn.o_proj.weight": "pytorch_model-00021-of-00191.bin", + "model.layers.13.self_attn.q_proj.weight": "pytorch_model-00021-of-00191.bin", + "model.layers.13.self_attn.v_proj.weight": "pytorch_model-00021-of-00191.bin", + "model.layers.14.input_layernorm.weight": "pytorch_model-00024-of-00191.bin", + "model.layers.14.mlp.down_proj.weight": "pytorch_model-00024-of-00191.bin", + "model.layers.14.mlp.gate_proj.weight": "pytorch_model-00023-of-00191.bin", + "model.layers.14.mlp.up_proj.weight": "pytorch_model-00023-of-00191.bin", + "model.layers.14.post_attention_layernorm.weight": "pytorch_model-00024-of-00191.bin", + "model.layers.14.self_attn.k_proj.weight": "pytorch_model-00022-of-00191.bin", + "model.layers.14.self_attn.o_proj.weight": "pytorch_model-00022-of-00191.bin", + "model.layers.14.self_attn.q_proj.weight": "pytorch_model-00022-of-00191.bin", + "model.layers.14.self_attn.v_proj.weight": "pytorch_model-00022-of-00191.bin", + "model.layers.15.input_layernorm.weight": "pytorch_model-00025-of-00191.bin", + "model.layers.15.mlp.down_proj.weight": "pytorch_model-00025-of-00191.bin", + "model.layers.15.mlp.gate_proj.weight": "pytorch_model-00024-of-00191.bin", + "model.layers.15.mlp.up_proj.weight": "pytorch_model-00025-of-00191.bin", + "model.layers.15.post_attention_layernorm.weight": "pytorch_model-00025-of-00191.bin", + "model.layers.15.self_attn.k_proj.weight": "pytorch_model-00024-of-00191.bin", + "model.layers.15.self_attn.o_proj.weight": "pytorch_model-00024-of-00191.bin", + "model.layers.15.self_attn.q_proj.weight": "pytorch_model-00024-of-00191.bin", + "model.layers.15.self_attn.v_proj.weight": "pytorch_model-00024-of-00191.bin", + "model.layers.16.input_layernorm.weight": "pytorch_model-00027-of-00191.bin", + "model.layers.16.mlp.down_proj.weight": "pytorch_model-00027-of-00191.bin", + "model.layers.16.mlp.gate_proj.weight": "pytorch_model-00026-of-00191.bin", + "model.layers.16.mlp.up_proj.weight": "pytorch_model-00026-of-00191.bin", + "model.layers.16.post_attention_layernorm.weight": "pytorch_model-00027-of-00191.bin", + "model.layers.16.self_attn.k_proj.weight": "pytorch_model-00025-of-00191.bin", + "model.layers.16.self_attn.o_proj.weight": "pytorch_model-00025-of-00191.bin", + "model.layers.16.self_attn.q_proj.weight": "pytorch_model-00025-of-00191.bin", + "model.layers.16.self_attn.v_proj.weight": "pytorch_model-00025-of-00191.bin", + "model.layers.17.input_layernorm.weight": "pytorch_model-00028-of-00191.bin", + "model.layers.17.mlp.down_proj.weight": "pytorch_model-00028-of-00191.bin", + "model.layers.17.mlp.gate_proj.weight": "pytorch_model-00027-of-00191.bin", + "model.layers.17.mlp.up_proj.weight": "pytorch_model-00028-of-00191.bin", + "model.layers.17.post_attention_layernorm.weight": "pytorch_model-00028-of-00191.bin", + "model.layers.17.self_attn.k_proj.weight": "pytorch_model-00027-of-00191.bin", + "model.layers.17.self_attn.o_proj.weight": "pytorch_model-00027-of-00191.bin", + "model.layers.17.self_attn.q_proj.weight": "pytorch_model-00027-of-00191.bin", + "model.layers.17.self_attn.v_proj.weight": "pytorch_model-00027-of-00191.bin", + "model.layers.18.input_layernorm.weight": "pytorch_model-00030-of-00191.bin", + "model.layers.18.mlp.down_proj.weight": "pytorch_model-00030-of-00191.bin", + "model.layers.18.mlp.gate_proj.weight": "pytorch_model-00029-of-00191.bin", + "model.layers.18.mlp.up_proj.weight": "pytorch_model-00029-of-00191.bin", + "model.layers.18.post_attention_layernorm.weight": "pytorch_model-00030-of-00191.bin", + "model.layers.18.self_attn.k_proj.weight": "pytorch_model-00028-of-00191.bin", + "model.layers.18.self_attn.o_proj.weight": "pytorch_model-00028-of-00191.bin", + "model.layers.18.self_attn.q_proj.weight": "pytorch_model-00028-of-00191.bin", + "model.layers.18.self_attn.v_proj.weight": "pytorch_model-00028-of-00191.bin", + "model.layers.19.input_layernorm.weight": "pytorch_model-00031-of-00191.bin", + "model.layers.19.mlp.down_proj.weight": "pytorch_model-00031-of-00191.bin", + "model.layers.19.mlp.gate_proj.weight": "pytorch_model-00030-of-00191.bin", + "model.layers.19.mlp.up_proj.weight": "pytorch_model-00031-of-00191.bin", + "model.layers.19.post_attention_layernorm.weight": "pytorch_model-00031-of-00191.bin", + "model.layers.19.self_attn.k_proj.weight": "pytorch_model-00030-of-00191.bin", + "model.layers.19.self_attn.o_proj.weight": "pytorch_model-00030-of-00191.bin", + "model.layers.19.self_attn.q_proj.weight": "pytorch_model-00030-of-00191.bin", + "model.layers.19.self_attn.v_proj.weight": "pytorch_model-00030-of-00191.bin", + "model.layers.2.input_layernorm.weight": "pytorch_model-00006-of-00191.bin", + "model.layers.2.mlp.down_proj.weight": "pytorch_model-00006-of-00191.bin", + "model.layers.2.mlp.gate_proj.weight": "pytorch_model-00005-of-00191.bin", + "model.layers.2.mlp.up_proj.weight": "pytorch_model-00005-of-00191.bin", + "model.layers.2.post_attention_layernorm.weight": "pytorch_model-00006-of-00191.bin", + "model.layers.2.self_attn.k_proj.weight": "pytorch_model-00004-of-00191.bin", + "model.layers.2.self_attn.o_proj.weight": "pytorch_model-00004-of-00191.bin", + "model.layers.2.self_attn.q_proj.weight": "pytorch_model-00004-of-00191.bin", + "model.layers.2.self_attn.v_proj.weight": "pytorch_model-00004-of-00191.bin", + "model.layers.20.input_layernorm.weight": "pytorch_model-00033-of-00191.bin", + "model.layers.20.mlp.down_proj.weight": "pytorch_model-00033-of-00191.bin", + "model.layers.20.mlp.gate_proj.weight": "pytorch_model-00032-of-00191.bin", + "model.layers.20.mlp.up_proj.weight": "pytorch_model-00032-of-00191.bin", + "model.layers.20.post_attention_layernorm.weight": "pytorch_model-00033-of-00191.bin", + "model.layers.20.self_attn.k_proj.weight": "pytorch_model-00031-of-00191.bin", + "model.layers.20.self_attn.o_proj.weight": "pytorch_model-00031-of-00191.bin", + "model.layers.20.self_attn.q_proj.weight": "pytorch_model-00031-of-00191.bin", + "model.layers.20.self_attn.v_proj.weight": "pytorch_model-00031-of-00191.bin", + "model.layers.21.input_layernorm.weight": "pytorch_model-00034-of-00191.bin", + "model.layers.21.mlp.down_proj.weight": "pytorch_model-00034-of-00191.bin", + "model.layers.21.mlp.gate_proj.weight": "pytorch_model-00033-of-00191.bin", + "model.layers.21.mlp.up_proj.weight": "pytorch_model-00034-of-00191.bin", + "model.layers.21.post_attention_layernorm.weight": "pytorch_model-00034-of-00191.bin", + "model.layers.21.self_attn.k_proj.weight": "pytorch_model-00033-of-00191.bin", + "model.layers.21.self_attn.o_proj.weight": "pytorch_model-00033-of-00191.bin", + "model.layers.21.self_attn.q_proj.weight": "pytorch_model-00033-of-00191.bin", + "model.layers.21.self_attn.v_proj.weight": "pytorch_model-00033-of-00191.bin", + "model.layers.22.input_layernorm.weight": "pytorch_model-00036-of-00191.bin", + "model.layers.22.mlp.down_proj.weight": "pytorch_model-00036-of-00191.bin", + "model.layers.22.mlp.gate_proj.weight": "pytorch_model-00035-of-00191.bin", + "model.layers.22.mlp.up_proj.weight": "pytorch_model-00035-of-00191.bin", + "model.layers.22.post_attention_layernorm.weight": "pytorch_model-00036-of-00191.bin", + "model.layers.22.self_attn.k_proj.weight": "pytorch_model-00034-of-00191.bin", + "model.layers.22.self_attn.o_proj.weight": "pytorch_model-00034-of-00191.bin", + "model.layers.22.self_attn.q_proj.weight": "pytorch_model-00034-of-00191.bin", + "model.layers.22.self_attn.v_proj.weight": "pytorch_model-00034-of-00191.bin", + "model.layers.23.input_layernorm.weight": "pytorch_model-00037-of-00191.bin", + "model.layers.23.mlp.down_proj.weight": "pytorch_model-00037-of-00191.bin", + "model.layers.23.mlp.gate_proj.weight": "pytorch_model-00036-of-00191.bin", + "model.layers.23.mlp.up_proj.weight": "pytorch_model-00037-of-00191.bin", + "model.layers.23.post_attention_layernorm.weight": "pytorch_model-00037-of-00191.bin", + "model.layers.23.self_attn.k_proj.weight": "pytorch_model-00036-of-00191.bin", + "model.layers.23.self_attn.o_proj.weight": "pytorch_model-00036-of-00191.bin", + "model.layers.23.self_attn.q_proj.weight": "pytorch_model-00036-of-00191.bin", + "model.layers.23.self_attn.v_proj.weight": "pytorch_model-00036-of-00191.bin", + "model.layers.24.input_layernorm.weight": "pytorch_model-00039-of-00191.bin", + "model.layers.24.mlp.down_proj.weight": "pytorch_model-00039-of-00191.bin", + "model.layers.24.mlp.gate_proj.weight": "pytorch_model-00038-of-00191.bin", + "model.layers.24.mlp.up_proj.weight": "pytorch_model-00038-of-00191.bin", + "model.layers.24.post_attention_layernorm.weight": "pytorch_model-00039-of-00191.bin", + "model.layers.24.self_attn.k_proj.weight": "pytorch_model-00037-of-00191.bin", + "model.layers.24.self_attn.o_proj.weight": "pytorch_model-00037-of-00191.bin", + "model.layers.24.self_attn.q_proj.weight": "pytorch_model-00037-of-00191.bin", + "model.layers.24.self_attn.v_proj.weight": "pytorch_model-00037-of-00191.bin", + "model.layers.25.input_layernorm.weight": "pytorch_model-00040-of-00191.bin", + "model.layers.25.mlp.down_proj.weight": "pytorch_model-00040-of-00191.bin", + "model.layers.25.mlp.gate_proj.weight": "pytorch_model-00039-of-00191.bin", + "model.layers.25.mlp.up_proj.weight": "pytorch_model-00040-of-00191.bin", + "model.layers.25.post_attention_layernorm.weight": "pytorch_model-00040-of-00191.bin", + "model.layers.25.self_attn.k_proj.weight": "pytorch_model-00039-of-00191.bin", + "model.layers.25.self_attn.o_proj.weight": "pytorch_model-00039-of-00191.bin", + "model.layers.25.self_attn.q_proj.weight": "pytorch_model-00039-of-00191.bin", + "model.layers.25.self_attn.v_proj.weight": "pytorch_model-00039-of-00191.bin", + "model.layers.26.input_layernorm.weight": "pytorch_model-00042-of-00191.bin", + "model.layers.26.mlp.down_proj.weight": "pytorch_model-00042-of-00191.bin", + "model.layers.26.mlp.gate_proj.weight": "pytorch_model-00041-of-00191.bin", + "model.layers.26.mlp.up_proj.weight": "pytorch_model-00041-of-00191.bin", + "model.layers.26.post_attention_layernorm.weight": "pytorch_model-00042-of-00191.bin", + "model.layers.26.self_attn.k_proj.weight": "pytorch_model-00040-of-00191.bin", + "model.layers.26.self_attn.o_proj.weight": "pytorch_model-00040-of-00191.bin", + "model.layers.26.self_attn.q_proj.weight": "pytorch_model-00040-of-00191.bin", + "model.layers.26.self_attn.v_proj.weight": "pytorch_model-00040-of-00191.bin", + "model.layers.27.input_layernorm.weight": "pytorch_model-00043-of-00191.bin", + "model.layers.27.mlp.down_proj.weight": "pytorch_model-00043-of-00191.bin", + "model.layers.27.mlp.gate_proj.weight": "pytorch_model-00042-of-00191.bin", + "model.layers.27.mlp.up_proj.weight": "pytorch_model-00043-of-00191.bin", + "model.layers.27.post_attention_layernorm.weight": "pytorch_model-00043-of-00191.bin", + "model.layers.27.self_attn.k_proj.weight": "pytorch_model-00042-of-00191.bin", + "model.layers.27.self_attn.o_proj.weight": "pytorch_model-00042-of-00191.bin", + "model.layers.27.self_attn.q_proj.weight": "pytorch_model-00042-of-00191.bin", + "model.layers.27.self_attn.v_proj.weight": "pytorch_model-00042-of-00191.bin", + "model.layers.28.input_layernorm.weight": "pytorch_model-00045-of-00191.bin", + "model.layers.28.mlp.down_proj.weight": "pytorch_model-00045-of-00191.bin", + "model.layers.28.mlp.gate_proj.weight": "pytorch_model-00044-of-00191.bin", + "model.layers.28.mlp.up_proj.weight": "pytorch_model-00044-of-00191.bin", + "model.layers.28.post_attention_layernorm.weight": "pytorch_model-00045-of-00191.bin", + "model.layers.28.self_attn.k_proj.weight": "pytorch_model-00043-of-00191.bin", + "model.layers.28.self_attn.o_proj.weight": "pytorch_model-00043-of-00191.bin", + "model.layers.28.self_attn.q_proj.weight": "pytorch_model-00043-of-00191.bin", + "model.layers.28.self_attn.v_proj.weight": "pytorch_model-00043-of-00191.bin", + "model.layers.29.input_layernorm.weight": "pytorch_model-00046-of-00191.bin", + "model.layers.29.mlp.down_proj.weight": "pytorch_model-00046-of-00191.bin", + "model.layers.29.mlp.gate_proj.weight": "pytorch_model-00045-of-00191.bin", + "model.layers.29.mlp.up_proj.weight": "pytorch_model-00046-of-00191.bin", + "model.layers.29.post_attention_layernorm.weight": "pytorch_model-00046-of-00191.bin", + "model.layers.29.self_attn.k_proj.weight": "pytorch_model-00045-of-00191.bin", + "model.layers.29.self_attn.o_proj.weight": "pytorch_model-00045-of-00191.bin", + "model.layers.29.self_attn.q_proj.weight": "pytorch_model-00045-of-00191.bin", + "model.layers.29.self_attn.v_proj.weight": "pytorch_model-00045-of-00191.bin", + "model.layers.3.input_layernorm.weight": "pytorch_model-00007-of-00191.bin", + "model.layers.3.mlp.down_proj.weight": "pytorch_model-00007-of-00191.bin", + "model.layers.3.mlp.gate_proj.weight": "pytorch_model-00006-of-00191.bin", + "model.layers.3.mlp.up_proj.weight": "pytorch_model-00007-of-00191.bin", + "model.layers.3.post_attention_layernorm.weight": "pytorch_model-00007-of-00191.bin", + "model.layers.3.self_attn.k_proj.weight": "pytorch_model-00006-of-00191.bin", + "model.layers.3.self_attn.o_proj.weight": "pytorch_model-00006-of-00191.bin", + "model.layers.3.self_attn.q_proj.weight": "pytorch_model-00006-of-00191.bin", + "model.layers.3.self_attn.v_proj.weight": "pytorch_model-00006-of-00191.bin", + "model.layers.30.input_layernorm.weight": "pytorch_model-00048-of-00191.bin", + "model.layers.30.mlp.down_proj.weight": "pytorch_model-00048-of-00191.bin", + "model.layers.30.mlp.gate_proj.weight": "pytorch_model-00047-of-00191.bin", + "model.layers.30.mlp.up_proj.weight": "pytorch_model-00047-of-00191.bin", + "model.layers.30.post_attention_layernorm.weight": "pytorch_model-00048-of-00191.bin", + "model.layers.30.self_attn.k_proj.weight": "pytorch_model-00046-of-00191.bin", + "model.layers.30.self_attn.o_proj.weight": "pytorch_model-00046-of-00191.bin", + "model.layers.30.self_attn.q_proj.weight": "pytorch_model-00046-of-00191.bin", + "model.layers.30.self_attn.v_proj.weight": "pytorch_model-00046-of-00191.bin", + "model.layers.31.input_layernorm.weight": "pytorch_model-00049-of-00191.bin", + "model.layers.31.mlp.down_proj.weight": "pytorch_model-00049-of-00191.bin", + "model.layers.31.mlp.gate_proj.weight": "pytorch_model-00048-of-00191.bin", + "model.layers.31.mlp.up_proj.weight": "pytorch_model-00049-of-00191.bin", + "model.layers.31.post_attention_layernorm.weight": "pytorch_model-00049-of-00191.bin", + "model.layers.31.self_attn.k_proj.weight": "pytorch_model-00048-of-00191.bin", + "model.layers.31.self_attn.o_proj.weight": "pytorch_model-00048-of-00191.bin", + "model.layers.31.self_attn.q_proj.weight": "pytorch_model-00048-of-00191.bin", + "model.layers.31.self_attn.v_proj.weight": "pytorch_model-00048-of-00191.bin", + "model.layers.32.input_layernorm.weight": "pytorch_model-00051-of-00191.bin", + "model.layers.32.mlp.down_proj.weight": "pytorch_model-00051-of-00191.bin", + "model.layers.32.mlp.gate_proj.weight": "pytorch_model-00050-of-00191.bin", + "model.layers.32.mlp.up_proj.weight": "pytorch_model-00050-of-00191.bin", + "model.layers.32.post_attention_layernorm.weight": "pytorch_model-00051-of-00191.bin", + "model.layers.32.self_attn.k_proj.weight": "pytorch_model-00049-of-00191.bin", + "model.layers.32.self_attn.o_proj.weight": "pytorch_model-00049-of-00191.bin", + "model.layers.32.self_attn.q_proj.weight": "pytorch_model-00049-of-00191.bin", + "model.layers.32.self_attn.v_proj.weight": "pytorch_model-00049-of-00191.bin", + "model.layers.33.input_layernorm.weight": "pytorch_model-00052-of-00191.bin", + "model.layers.33.mlp.down_proj.weight": "pytorch_model-00052-of-00191.bin", + "model.layers.33.mlp.gate_proj.weight": "pytorch_model-00051-of-00191.bin", + "model.layers.33.mlp.up_proj.weight": "pytorch_model-00052-of-00191.bin", + "model.layers.33.post_attention_layernorm.weight": "pytorch_model-00052-of-00191.bin", + "model.layers.33.self_attn.k_proj.weight": "pytorch_model-00051-of-00191.bin", + "model.layers.33.self_attn.o_proj.weight": "pytorch_model-00051-of-00191.bin", + "model.layers.33.self_attn.q_proj.weight": "pytorch_model-00051-of-00191.bin", + "model.layers.33.self_attn.v_proj.weight": "pytorch_model-00051-of-00191.bin", + "model.layers.34.input_layernorm.weight": "pytorch_model-00054-of-00191.bin", + "model.layers.34.mlp.down_proj.weight": "pytorch_model-00054-of-00191.bin", + "model.layers.34.mlp.gate_proj.weight": "pytorch_model-00053-of-00191.bin", + "model.layers.34.mlp.up_proj.weight": "pytorch_model-00053-of-00191.bin", + "model.layers.34.post_attention_layernorm.weight": "pytorch_model-00054-of-00191.bin", + "model.layers.34.self_attn.k_proj.weight": "pytorch_model-00052-of-00191.bin", + "model.layers.34.self_attn.o_proj.weight": "pytorch_model-00052-of-00191.bin", + "model.layers.34.self_attn.q_proj.weight": "pytorch_model-00052-of-00191.bin", + "model.layers.34.self_attn.v_proj.weight": "pytorch_model-00052-of-00191.bin", + "model.layers.35.input_layernorm.weight": "pytorch_model-00055-of-00191.bin", + "model.layers.35.mlp.down_proj.weight": "pytorch_model-00055-of-00191.bin", + "model.layers.35.mlp.gate_proj.weight": "pytorch_model-00054-of-00191.bin", + "model.layers.35.mlp.up_proj.weight": "pytorch_model-00055-of-00191.bin", + "model.layers.35.post_attention_layernorm.weight": "pytorch_model-00055-of-00191.bin", + "model.layers.35.self_attn.k_proj.weight": "pytorch_model-00054-of-00191.bin", + "model.layers.35.self_attn.o_proj.weight": "pytorch_model-00054-of-00191.bin", + "model.layers.35.self_attn.q_proj.weight": "pytorch_model-00054-of-00191.bin", + "model.layers.35.self_attn.v_proj.weight": "pytorch_model-00054-of-00191.bin", + "model.layers.36.input_layernorm.weight": "pytorch_model-00057-of-00191.bin", + "model.layers.36.mlp.down_proj.weight": "pytorch_model-00057-of-00191.bin", + "model.layers.36.mlp.gate_proj.weight": "pytorch_model-00056-of-00191.bin", + "model.layers.36.mlp.up_proj.weight": "pytorch_model-00056-of-00191.bin", + "model.layers.36.post_attention_layernorm.weight": "pytorch_model-00057-of-00191.bin", + "model.layers.36.self_attn.k_proj.weight": "pytorch_model-00055-of-00191.bin", + "model.layers.36.self_attn.o_proj.weight": "pytorch_model-00055-of-00191.bin", + "model.layers.36.self_attn.q_proj.weight": "pytorch_model-00055-of-00191.bin", + "model.layers.36.self_attn.v_proj.weight": "pytorch_model-00055-of-00191.bin", + "model.layers.37.input_layernorm.weight": "pytorch_model-00058-of-00191.bin", + "model.layers.37.mlp.down_proj.weight": "pytorch_model-00058-of-00191.bin", + "model.layers.37.mlp.gate_proj.weight": "pytorch_model-00057-of-00191.bin", + "model.layers.37.mlp.up_proj.weight": "pytorch_model-00058-of-00191.bin", + "model.layers.37.post_attention_layernorm.weight": "pytorch_model-00058-of-00191.bin", + "model.layers.37.self_attn.k_proj.weight": "pytorch_model-00057-of-00191.bin", + "model.layers.37.self_attn.o_proj.weight": "pytorch_model-00057-of-00191.bin", + "model.layers.37.self_attn.q_proj.weight": "pytorch_model-00057-of-00191.bin", + "model.layers.37.self_attn.v_proj.weight": "pytorch_model-00057-of-00191.bin", + "model.layers.38.input_layernorm.weight": "pytorch_model-00060-of-00191.bin", + "model.layers.38.mlp.down_proj.weight": "pytorch_model-00060-of-00191.bin", + "model.layers.38.mlp.gate_proj.weight": "pytorch_model-00059-of-00191.bin", + "model.layers.38.mlp.up_proj.weight": "pytorch_model-00059-of-00191.bin", + "model.layers.38.post_attention_layernorm.weight": "pytorch_model-00060-of-00191.bin", + "model.layers.38.self_attn.k_proj.weight": "pytorch_model-00058-of-00191.bin", + "model.layers.38.self_attn.o_proj.weight": "pytorch_model-00058-of-00191.bin", + "model.layers.38.self_attn.q_proj.weight": "pytorch_model-00058-of-00191.bin", + "model.layers.38.self_attn.v_proj.weight": "pytorch_model-00058-of-00191.bin", + "model.layers.39.input_layernorm.weight": "pytorch_model-00061-of-00191.bin", + "model.layers.39.mlp.down_proj.weight": "pytorch_model-00061-of-00191.bin", + "model.layers.39.mlp.gate_proj.weight": "pytorch_model-00060-of-00191.bin", + "model.layers.39.mlp.up_proj.weight": "pytorch_model-00061-of-00191.bin", + "model.layers.39.post_attention_layernorm.weight": "pytorch_model-00061-of-00191.bin", + "model.layers.39.self_attn.k_proj.weight": "pytorch_model-00060-of-00191.bin", + "model.layers.39.self_attn.o_proj.weight": "pytorch_model-00060-of-00191.bin", + "model.layers.39.self_attn.q_proj.weight": "pytorch_model-00060-of-00191.bin", + "model.layers.39.self_attn.v_proj.weight": "pytorch_model-00060-of-00191.bin", + "model.layers.4.input_layernorm.weight": "pytorch_model-00009-of-00191.bin", + "model.layers.4.mlp.down_proj.weight": "pytorch_model-00009-of-00191.bin", + "model.layers.4.mlp.gate_proj.weight": "pytorch_model-00008-of-00191.bin", + "model.layers.4.mlp.up_proj.weight": "pytorch_model-00008-of-00191.bin", + "model.layers.4.post_attention_layernorm.weight": "pytorch_model-00009-of-00191.bin", + "model.layers.4.self_attn.k_proj.weight": "pytorch_model-00007-of-00191.bin", + "model.layers.4.self_attn.o_proj.weight": "pytorch_model-00007-of-00191.bin", + "model.layers.4.self_attn.q_proj.weight": "pytorch_model-00007-of-00191.bin", + "model.layers.4.self_attn.v_proj.weight": "pytorch_model-00007-of-00191.bin", + "model.layers.40.input_layernorm.weight": "pytorch_model-00063-of-00191.bin", + "model.layers.40.mlp.down_proj.weight": "pytorch_model-00063-of-00191.bin", + "model.layers.40.mlp.gate_proj.weight": "pytorch_model-00062-of-00191.bin", + "model.layers.40.mlp.up_proj.weight": "pytorch_model-00062-of-00191.bin", + "model.layers.40.post_attention_layernorm.weight": "pytorch_model-00063-of-00191.bin", + "model.layers.40.self_attn.k_proj.weight": "pytorch_model-00061-of-00191.bin", + "model.layers.40.self_attn.o_proj.weight": "pytorch_model-00061-of-00191.bin", + "model.layers.40.self_attn.q_proj.weight": "pytorch_model-00061-of-00191.bin", + "model.layers.40.self_attn.v_proj.weight": "pytorch_model-00061-of-00191.bin", + "model.layers.41.input_layernorm.weight": "pytorch_model-00064-of-00191.bin", + "model.layers.41.mlp.down_proj.weight": "pytorch_model-00064-of-00191.bin", + "model.layers.41.mlp.gate_proj.weight": "pytorch_model-00063-of-00191.bin", + "model.layers.41.mlp.up_proj.weight": "pytorch_model-00064-of-00191.bin", + "model.layers.41.post_attention_layernorm.weight": "pytorch_model-00064-of-00191.bin", + "model.layers.41.self_attn.k_proj.weight": "pytorch_model-00063-of-00191.bin", + "model.layers.41.self_attn.o_proj.weight": "pytorch_model-00063-of-00191.bin", + "model.layers.41.self_attn.q_proj.weight": "pytorch_model-00063-of-00191.bin", + "model.layers.41.self_attn.v_proj.weight": "pytorch_model-00063-of-00191.bin", + "model.layers.42.input_layernorm.weight": "pytorch_model-00066-of-00191.bin", + "model.layers.42.mlp.down_proj.weight": "pytorch_model-00066-of-00191.bin", + "model.layers.42.mlp.gate_proj.weight": "pytorch_model-00065-of-00191.bin", + "model.layers.42.mlp.up_proj.weight": "pytorch_model-00065-of-00191.bin", + "model.layers.42.post_attention_layernorm.weight": "pytorch_model-00066-of-00191.bin", + "model.layers.42.self_attn.k_proj.weight": "pytorch_model-00064-of-00191.bin", + "model.layers.42.self_attn.o_proj.weight": "pytorch_model-00064-of-00191.bin", + "model.layers.42.self_attn.q_proj.weight": "pytorch_model-00064-of-00191.bin", + "model.layers.42.self_attn.v_proj.weight": "pytorch_model-00064-of-00191.bin", + "model.layers.43.input_layernorm.weight": "pytorch_model-00067-of-00191.bin", + "model.layers.43.mlp.down_proj.weight": "pytorch_model-00067-of-00191.bin", + "model.layers.43.mlp.gate_proj.weight": "pytorch_model-00066-of-00191.bin", + "model.layers.43.mlp.up_proj.weight": "pytorch_model-00067-of-00191.bin", + "model.layers.43.post_attention_layernorm.weight": "pytorch_model-00067-of-00191.bin", + "model.layers.43.self_attn.k_proj.weight": "pytorch_model-00066-of-00191.bin", + "model.layers.43.self_attn.o_proj.weight": "pytorch_model-00066-of-00191.bin", + "model.layers.43.self_attn.q_proj.weight": "pytorch_model-00066-of-00191.bin", + "model.layers.43.self_attn.v_proj.weight": "pytorch_model-00066-of-00191.bin", + "model.layers.44.input_layernorm.weight": "pytorch_model-00069-of-00191.bin", + "model.layers.44.mlp.down_proj.weight": "pytorch_model-00069-of-00191.bin", + "model.layers.44.mlp.gate_proj.weight": "pytorch_model-00068-of-00191.bin", + "model.layers.44.mlp.up_proj.weight": "pytorch_model-00068-of-00191.bin", + "model.layers.44.post_attention_layernorm.weight": "pytorch_model-00069-of-00191.bin", + "model.layers.44.self_attn.k_proj.weight": "pytorch_model-00067-of-00191.bin", + "model.layers.44.self_attn.o_proj.weight": "pytorch_model-00067-of-00191.bin", + "model.layers.44.self_attn.q_proj.weight": "pytorch_model-00067-of-00191.bin", + "model.layers.44.self_attn.v_proj.weight": "pytorch_model-00067-of-00191.bin", + "model.layers.45.input_layernorm.weight": "pytorch_model-00070-of-00191.bin", + "model.layers.45.mlp.down_proj.weight": "pytorch_model-00070-of-00191.bin", + "model.layers.45.mlp.gate_proj.weight": "pytorch_model-00069-of-00191.bin", + "model.layers.45.mlp.up_proj.weight": "pytorch_model-00070-of-00191.bin", + "model.layers.45.post_attention_layernorm.weight": "pytorch_model-00070-of-00191.bin", + "model.layers.45.self_attn.k_proj.weight": "pytorch_model-00069-of-00191.bin", + "model.layers.45.self_attn.o_proj.weight": "pytorch_model-00069-of-00191.bin", + "model.layers.45.self_attn.q_proj.weight": "pytorch_model-00069-of-00191.bin", + "model.layers.45.self_attn.v_proj.weight": "pytorch_model-00069-of-00191.bin", + "model.layers.46.input_layernorm.weight": "pytorch_model-00072-of-00191.bin", + "model.layers.46.mlp.down_proj.weight": "pytorch_model-00072-of-00191.bin", + "model.layers.46.mlp.gate_proj.weight": "pytorch_model-00071-of-00191.bin", + "model.layers.46.mlp.up_proj.weight": "pytorch_model-00071-of-00191.bin", + "model.layers.46.post_attention_layernorm.weight": "pytorch_model-00072-of-00191.bin", + "model.layers.46.self_attn.k_proj.weight": "pytorch_model-00070-of-00191.bin", + "model.layers.46.self_attn.o_proj.weight": "pytorch_model-00070-of-00191.bin", + "model.layers.46.self_attn.q_proj.weight": "pytorch_model-00070-of-00191.bin", + "model.layers.46.self_attn.v_proj.weight": "pytorch_model-00070-of-00191.bin", + "model.layers.47.input_layernorm.weight": "pytorch_model-00073-of-00191.bin", + "model.layers.47.mlp.down_proj.weight": "pytorch_model-00073-of-00191.bin", + "model.layers.47.mlp.gate_proj.weight": "pytorch_model-00072-of-00191.bin", + "model.layers.47.mlp.up_proj.weight": "pytorch_model-00073-of-00191.bin", + "model.layers.47.post_attention_layernorm.weight": "pytorch_model-00073-of-00191.bin", + "model.layers.47.self_attn.k_proj.weight": "pytorch_model-00072-of-00191.bin", + "model.layers.47.self_attn.o_proj.weight": "pytorch_model-00072-of-00191.bin", + "model.layers.47.self_attn.q_proj.weight": "pytorch_model-00072-of-00191.bin", + "model.layers.47.self_attn.v_proj.weight": "pytorch_model-00072-of-00191.bin", + "model.layers.48.input_layernorm.weight": "pytorch_model-00075-of-00191.bin", + "model.layers.48.mlp.down_proj.weight": "pytorch_model-00075-of-00191.bin", + "model.layers.48.mlp.gate_proj.weight": "pytorch_model-00074-of-00191.bin", + "model.layers.48.mlp.up_proj.weight": "pytorch_model-00074-of-00191.bin", + "model.layers.48.post_attention_layernorm.weight": "pytorch_model-00075-of-00191.bin", + "model.layers.48.self_attn.k_proj.weight": "pytorch_model-00073-of-00191.bin", + "model.layers.48.self_attn.o_proj.weight": "pytorch_model-00073-of-00191.bin", + "model.layers.48.self_attn.q_proj.weight": "pytorch_model-00073-of-00191.bin", + "model.layers.48.self_attn.v_proj.weight": "pytorch_model-00073-of-00191.bin", + "model.layers.49.input_layernorm.weight": "pytorch_model-00076-of-00191.bin", + "model.layers.49.mlp.down_proj.weight": "pytorch_model-00076-of-00191.bin", + "model.layers.49.mlp.gate_proj.weight": "pytorch_model-00075-of-00191.bin", + "model.layers.49.mlp.up_proj.weight": "pytorch_model-00076-of-00191.bin", + "model.layers.49.post_attention_layernorm.weight": "pytorch_model-00076-of-00191.bin", + "model.layers.49.self_attn.k_proj.weight": "pytorch_model-00075-of-00191.bin", + "model.layers.49.self_attn.o_proj.weight": "pytorch_model-00075-of-00191.bin", + "model.layers.49.self_attn.q_proj.weight": "pytorch_model-00075-of-00191.bin", + "model.layers.49.self_attn.v_proj.weight": "pytorch_model-00075-of-00191.bin", + "model.layers.5.input_layernorm.weight": "pytorch_model-00010-of-00191.bin", + "model.layers.5.mlp.down_proj.weight": "pytorch_model-00010-of-00191.bin", + "model.layers.5.mlp.gate_proj.weight": "pytorch_model-00009-of-00191.bin", + "model.layers.5.mlp.up_proj.weight": "pytorch_model-00010-of-00191.bin", + "model.layers.5.post_attention_layernorm.weight": "pytorch_model-00010-of-00191.bin", + "model.layers.5.self_attn.k_proj.weight": "pytorch_model-00009-of-00191.bin", + "model.layers.5.self_attn.o_proj.weight": "pytorch_model-00009-of-00191.bin", + "model.layers.5.self_attn.q_proj.weight": "pytorch_model-00009-of-00191.bin", + "model.layers.5.self_attn.v_proj.weight": "pytorch_model-00009-of-00191.bin", + "model.layers.50.input_layernorm.weight": "pytorch_model-00078-of-00191.bin", + "model.layers.50.mlp.down_proj.weight": "pytorch_model-00078-of-00191.bin", + "model.layers.50.mlp.gate_proj.weight": "pytorch_model-00077-of-00191.bin", + "model.layers.50.mlp.up_proj.weight": "pytorch_model-00077-of-00191.bin", + "model.layers.50.post_attention_layernorm.weight": "pytorch_model-00078-of-00191.bin", + "model.layers.50.self_attn.k_proj.weight": "pytorch_model-00076-of-00191.bin", + "model.layers.50.self_attn.o_proj.weight": "pytorch_model-00076-of-00191.bin", + "model.layers.50.self_attn.q_proj.weight": "pytorch_model-00076-of-00191.bin", + "model.layers.50.self_attn.v_proj.weight": "pytorch_model-00076-of-00191.bin", + "model.layers.51.input_layernorm.weight": "pytorch_model-00079-of-00191.bin", + "model.layers.51.mlp.down_proj.weight": "pytorch_model-00079-of-00191.bin", + "model.layers.51.mlp.gate_proj.weight": "pytorch_model-00078-of-00191.bin", + "model.layers.51.mlp.up_proj.weight": "pytorch_model-00079-of-00191.bin", + "model.layers.51.post_attention_layernorm.weight": "pytorch_model-00079-of-00191.bin", + "model.layers.51.self_attn.k_proj.weight": "pytorch_model-00078-of-00191.bin", + "model.layers.51.self_attn.o_proj.weight": "pytorch_model-00078-of-00191.bin", + "model.layers.51.self_attn.q_proj.weight": "pytorch_model-00078-of-00191.bin", + "model.layers.51.self_attn.v_proj.weight": "pytorch_model-00078-of-00191.bin", + "model.layers.52.input_layernorm.weight": "pytorch_model-00081-of-00191.bin", + "model.layers.52.mlp.down_proj.weight": "pytorch_model-00081-of-00191.bin", + "model.layers.52.mlp.gate_proj.weight": "pytorch_model-00080-of-00191.bin", + "model.layers.52.mlp.up_proj.weight": "pytorch_model-00080-of-00191.bin", + "model.layers.52.post_attention_layernorm.weight": "pytorch_model-00081-of-00191.bin", + "model.layers.52.self_attn.k_proj.weight": "pytorch_model-00079-of-00191.bin", + "model.layers.52.self_attn.o_proj.weight": "pytorch_model-00079-of-00191.bin", + "model.layers.52.self_attn.q_proj.weight": "pytorch_model-00079-of-00191.bin", + "model.layers.52.self_attn.v_proj.weight": "pytorch_model-00079-of-00191.bin", + "model.layers.53.input_layernorm.weight": "pytorch_model-00082-of-00191.bin", + "model.layers.53.mlp.down_proj.weight": "pytorch_model-00082-of-00191.bin", + "model.layers.53.mlp.gate_proj.weight": "pytorch_model-00081-of-00191.bin", + "model.layers.53.mlp.up_proj.weight": "pytorch_model-00082-of-00191.bin", + "model.layers.53.post_attention_layernorm.weight": "pytorch_model-00082-of-00191.bin", + "model.layers.53.self_attn.k_proj.weight": "pytorch_model-00081-of-00191.bin", + "model.layers.53.self_attn.o_proj.weight": "pytorch_model-00081-of-00191.bin", + "model.layers.53.self_attn.q_proj.weight": "pytorch_model-00081-of-00191.bin", + "model.layers.53.self_attn.v_proj.weight": "pytorch_model-00081-of-00191.bin", + "model.layers.54.input_layernorm.weight": "pytorch_model-00084-of-00191.bin", + "model.layers.54.mlp.down_proj.weight": "pytorch_model-00084-of-00191.bin", + "model.layers.54.mlp.gate_proj.weight": "pytorch_model-00083-of-00191.bin", + "model.layers.54.mlp.up_proj.weight": "pytorch_model-00083-of-00191.bin", + "model.layers.54.post_attention_layernorm.weight": "pytorch_model-00084-of-00191.bin", + "model.layers.54.self_attn.k_proj.weight": "pytorch_model-00082-of-00191.bin", + "model.layers.54.self_attn.o_proj.weight": "pytorch_model-00082-of-00191.bin", + "model.layers.54.self_attn.q_proj.weight": "pytorch_model-00082-of-00191.bin", + "model.layers.54.self_attn.v_proj.weight": "pytorch_model-00082-of-00191.bin", + "model.layers.55.input_layernorm.weight": "pytorch_model-00085-of-00191.bin", + "model.layers.55.mlp.down_proj.weight": "pytorch_model-00085-of-00191.bin", + "model.layers.55.mlp.gate_proj.weight": "pytorch_model-00084-of-00191.bin", + "model.layers.55.mlp.up_proj.weight": "pytorch_model-00085-of-00191.bin", + "model.layers.55.post_attention_layernorm.weight": "pytorch_model-00085-of-00191.bin", + "model.layers.55.self_attn.k_proj.weight": "pytorch_model-00084-of-00191.bin", + "model.layers.55.self_attn.o_proj.weight": "pytorch_model-00084-of-00191.bin", + "model.layers.55.self_attn.q_proj.weight": "pytorch_model-00084-of-00191.bin", + "model.layers.55.self_attn.v_proj.weight": "pytorch_model-00084-of-00191.bin", + "model.layers.56.input_layernorm.weight": "pytorch_model-00087-of-00191.bin", + "model.layers.56.mlp.down_proj.weight": "pytorch_model-00087-of-00191.bin", + "model.layers.56.mlp.gate_proj.weight": "pytorch_model-00086-of-00191.bin", + "model.layers.56.mlp.up_proj.weight": "pytorch_model-00086-of-00191.bin", + "model.layers.56.post_attention_layernorm.weight": "pytorch_model-00087-of-00191.bin", + "model.layers.56.self_attn.k_proj.weight": "pytorch_model-00085-of-00191.bin", + "model.layers.56.self_attn.o_proj.weight": "pytorch_model-00085-of-00191.bin", + "model.layers.56.self_attn.q_proj.weight": "pytorch_model-00085-of-00191.bin", + "model.layers.56.self_attn.v_proj.weight": "pytorch_model-00085-of-00191.bin", + "model.layers.57.input_layernorm.weight": "pytorch_model-00088-of-00191.bin", + "model.layers.57.mlp.down_proj.weight": "pytorch_model-00088-of-00191.bin", + "model.layers.57.mlp.gate_proj.weight": "pytorch_model-00087-of-00191.bin", + "model.layers.57.mlp.up_proj.weight": "pytorch_model-00088-of-00191.bin", + "model.layers.57.post_attention_layernorm.weight": "pytorch_model-00088-of-00191.bin", + "model.layers.57.self_attn.k_proj.weight": "pytorch_model-00087-of-00191.bin", + "model.layers.57.self_attn.o_proj.weight": "pytorch_model-00087-of-00191.bin", + "model.layers.57.self_attn.q_proj.weight": "pytorch_model-00087-of-00191.bin", + "model.layers.57.self_attn.v_proj.weight": "pytorch_model-00087-of-00191.bin", + "model.layers.58.input_layernorm.weight": "pytorch_model-00090-of-00191.bin", + "model.layers.58.mlp.down_proj.weight": "pytorch_model-00090-of-00191.bin", + "model.layers.58.mlp.gate_proj.weight": "pytorch_model-00089-of-00191.bin", + "model.layers.58.mlp.up_proj.weight": "pytorch_model-00089-of-00191.bin", + "model.layers.58.post_attention_layernorm.weight": "pytorch_model-00090-of-00191.bin", + "model.layers.58.self_attn.k_proj.weight": "pytorch_model-00088-of-00191.bin", + "model.layers.58.self_attn.o_proj.weight": "pytorch_model-00088-of-00191.bin", + "model.layers.58.self_attn.q_proj.weight": "pytorch_model-00088-of-00191.bin", + "model.layers.58.self_attn.v_proj.weight": "pytorch_model-00088-of-00191.bin", + "model.layers.59.input_layernorm.weight": "pytorch_model-00091-of-00191.bin", + "model.layers.59.mlp.down_proj.weight": "pytorch_model-00091-of-00191.bin", + "model.layers.59.mlp.gate_proj.weight": "pytorch_model-00090-of-00191.bin", + "model.layers.59.mlp.up_proj.weight": "pytorch_model-00091-of-00191.bin", + "model.layers.59.post_attention_layernorm.weight": "pytorch_model-00091-of-00191.bin", + "model.layers.59.self_attn.k_proj.weight": "pytorch_model-00090-of-00191.bin", + "model.layers.59.self_attn.o_proj.weight": "pytorch_model-00090-of-00191.bin", + "model.layers.59.self_attn.q_proj.weight": "pytorch_model-00090-of-00191.bin", + "model.layers.59.self_attn.v_proj.weight": "pytorch_model-00090-of-00191.bin", + "model.layers.6.input_layernorm.weight": "pytorch_model-00012-of-00191.bin", + "model.layers.6.mlp.down_proj.weight": "pytorch_model-00012-of-00191.bin", + "model.layers.6.mlp.gate_proj.weight": "pytorch_model-00011-of-00191.bin", + "model.layers.6.mlp.up_proj.weight": "pytorch_model-00011-of-00191.bin", + "model.layers.6.post_attention_layernorm.weight": "pytorch_model-00012-of-00191.bin", + "model.layers.6.self_attn.k_proj.weight": "pytorch_model-00010-of-00191.bin", + "model.layers.6.self_attn.o_proj.weight": "pytorch_model-00010-of-00191.bin", + "model.layers.6.self_attn.q_proj.weight": "pytorch_model-00010-of-00191.bin", + "model.layers.6.self_attn.v_proj.weight": "pytorch_model-00010-of-00191.bin", + "model.layers.60.input_layernorm.weight": "pytorch_model-00093-of-00191.bin", + "model.layers.60.mlp.down_proj.weight": "pytorch_model-00093-of-00191.bin", + "model.layers.60.mlp.gate_proj.weight": "pytorch_model-00092-of-00191.bin", + "model.layers.60.mlp.up_proj.weight": "pytorch_model-00092-of-00191.bin", + "model.layers.60.post_attention_layernorm.weight": "pytorch_model-00093-of-00191.bin", + "model.layers.60.self_attn.k_proj.weight": "pytorch_model-00091-of-00191.bin", + "model.layers.60.self_attn.o_proj.weight": "pytorch_model-00091-of-00191.bin", + "model.layers.60.self_attn.q_proj.weight": "pytorch_model-00091-of-00191.bin", + "model.layers.60.self_attn.v_proj.weight": "pytorch_model-00091-of-00191.bin", + "model.layers.61.input_layernorm.weight": "pytorch_model-00094-of-00191.bin", + "model.layers.61.mlp.down_proj.weight": "pytorch_model-00094-of-00191.bin", + "model.layers.61.mlp.gate_proj.weight": "pytorch_model-00093-of-00191.bin", + "model.layers.61.mlp.up_proj.weight": "pytorch_model-00094-of-00191.bin", + "model.layers.61.post_attention_layernorm.weight": "pytorch_model-00094-of-00191.bin", + "model.layers.61.self_attn.k_proj.weight": "pytorch_model-00093-of-00191.bin", + "model.layers.61.self_attn.o_proj.weight": "pytorch_model-00093-of-00191.bin", + "model.layers.61.self_attn.q_proj.weight": "pytorch_model-00093-of-00191.bin", + "model.layers.61.self_attn.v_proj.weight": "pytorch_model-00093-of-00191.bin", + "model.layers.62.input_layernorm.weight": "pytorch_model-00096-of-00191.bin", + "model.layers.62.mlp.down_proj.weight": "pytorch_model-00096-of-00191.bin", + "model.layers.62.mlp.gate_proj.weight": "pytorch_model-00095-of-00191.bin", + "model.layers.62.mlp.up_proj.weight": "pytorch_model-00095-of-00191.bin", + "model.layers.62.post_attention_layernorm.weight": "pytorch_model-00096-of-00191.bin", + "model.layers.62.self_attn.k_proj.weight": "pytorch_model-00094-of-00191.bin", + "model.layers.62.self_attn.o_proj.weight": "pytorch_model-00094-of-00191.bin", + "model.layers.62.self_attn.q_proj.weight": "pytorch_model-00094-of-00191.bin", + "model.layers.62.self_attn.v_proj.weight": "pytorch_model-00094-of-00191.bin", + "model.layers.63.input_layernorm.weight": "pytorch_model-00097-of-00191.bin", + "model.layers.63.mlp.down_proj.weight": "pytorch_model-00097-of-00191.bin", + "model.layers.63.mlp.gate_proj.weight": "pytorch_model-00096-of-00191.bin", + "model.layers.63.mlp.up_proj.weight": "pytorch_model-00097-of-00191.bin", + "model.layers.63.post_attention_layernorm.weight": "pytorch_model-00097-of-00191.bin", + "model.layers.63.self_attn.k_proj.weight": "pytorch_model-00096-of-00191.bin", + "model.layers.63.self_attn.o_proj.weight": "pytorch_model-00096-of-00191.bin", + "model.layers.63.self_attn.q_proj.weight": "pytorch_model-00096-of-00191.bin", + "model.layers.63.self_attn.v_proj.weight": "pytorch_model-00096-of-00191.bin", + "model.layers.64.input_layernorm.weight": "pytorch_model-00099-of-00191.bin", + "model.layers.64.mlp.down_proj.weight": "pytorch_model-00099-of-00191.bin", + "model.layers.64.mlp.gate_proj.weight": "pytorch_model-00098-of-00191.bin", + "model.layers.64.mlp.up_proj.weight": "pytorch_model-00098-of-00191.bin", + "model.layers.64.post_attention_layernorm.weight": "pytorch_model-00099-of-00191.bin", + "model.layers.64.self_attn.k_proj.weight": "pytorch_model-00097-of-00191.bin", + "model.layers.64.self_attn.o_proj.weight": "pytorch_model-00097-of-00191.bin", + "model.layers.64.self_attn.q_proj.weight": "pytorch_model-00097-of-00191.bin", + "model.layers.64.self_attn.v_proj.weight": "pytorch_model-00097-of-00191.bin", + "model.layers.65.input_layernorm.weight": "pytorch_model-00100-of-00191.bin", + "model.layers.65.mlp.down_proj.weight": "pytorch_model-00100-of-00191.bin", + "model.layers.65.mlp.gate_proj.weight": "pytorch_model-00099-of-00191.bin", + "model.layers.65.mlp.up_proj.weight": "pytorch_model-00100-of-00191.bin", + "model.layers.65.post_attention_layernorm.weight": "pytorch_model-00100-of-00191.bin", + "model.layers.65.self_attn.k_proj.weight": "pytorch_model-00099-of-00191.bin", + "model.layers.65.self_attn.o_proj.weight": "pytorch_model-00099-of-00191.bin", + "model.layers.65.self_attn.q_proj.weight": "pytorch_model-00099-of-00191.bin", + "model.layers.65.self_attn.v_proj.weight": "pytorch_model-00099-of-00191.bin", + "model.layers.66.input_layernorm.weight": "pytorch_model-00102-of-00191.bin", + "model.layers.66.mlp.down_proj.weight": "pytorch_model-00102-of-00191.bin", + "model.layers.66.mlp.gate_proj.weight": "pytorch_model-00101-of-00191.bin", + "model.layers.66.mlp.up_proj.weight": "pytorch_model-00101-of-00191.bin", + "model.layers.66.post_attention_layernorm.weight": "pytorch_model-00102-of-00191.bin", + "model.layers.66.self_attn.k_proj.weight": "pytorch_model-00100-of-00191.bin", + "model.layers.66.self_attn.o_proj.weight": "pytorch_model-00100-of-00191.bin", + "model.layers.66.self_attn.q_proj.weight": "pytorch_model-00100-of-00191.bin", + "model.layers.66.self_attn.v_proj.weight": "pytorch_model-00100-of-00191.bin", + "model.layers.67.input_layernorm.weight": "pytorch_model-00103-of-00191.bin", + "model.layers.67.mlp.down_proj.weight": "pytorch_model-00103-of-00191.bin", + "model.layers.67.mlp.gate_proj.weight": "pytorch_model-00102-of-00191.bin", + "model.layers.67.mlp.up_proj.weight": "pytorch_model-00103-of-00191.bin", + "model.layers.67.post_attention_layernorm.weight": "pytorch_model-00103-of-00191.bin", + "model.layers.67.self_attn.k_proj.weight": "pytorch_model-00102-of-00191.bin", + "model.layers.67.self_attn.o_proj.weight": "pytorch_model-00102-of-00191.bin", + "model.layers.67.self_attn.q_proj.weight": "pytorch_model-00102-of-00191.bin", + "model.layers.67.self_attn.v_proj.weight": "pytorch_model-00102-of-00191.bin", + "model.layers.68.input_layernorm.weight": "pytorch_model-00105-of-00191.bin", + "model.layers.68.mlp.down_proj.weight": "pytorch_model-00105-of-00191.bin", + "model.layers.68.mlp.gate_proj.weight": "pytorch_model-00104-of-00191.bin", + "model.layers.68.mlp.up_proj.weight": "pytorch_model-00104-of-00191.bin", + "model.layers.68.post_attention_layernorm.weight": "pytorch_model-00105-of-00191.bin", + "model.layers.68.self_attn.k_proj.weight": "pytorch_model-00103-of-00191.bin", + "model.layers.68.self_attn.o_proj.weight": "pytorch_model-00103-of-00191.bin", + "model.layers.68.self_attn.q_proj.weight": "pytorch_model-00103-of-00191.bin", + "model.layers.68.self_attn.v_proj.weight": "pytorch_model-00103-of-00191.bin", + "model.layers.69.input_layernorm.weight": "pytorch_model-00106-of-00191.bin", + "model.layers.69.mlp.down_proj.weight": "pytorch_model-00106-of-00191.bin", + "model.layers.69.mlp.gate_proj.weight": "pytorch_model-00105-of-00191.bin", + "model.layers.69.mlp.up_proj.weight": "pytorch_model-00106-of-00191.bin", + "model.layers.69.post_attention_layernorm.weight": "pytorch_model-00106-of-00191.bin", + "model.layers.69.self_attn.k_proj.weight": "pytorch_model-00105-of-00191.bin", + "model.layers.69.self_attn.o_proj.weight": "pytorch_model-00105-of-00191.bin", + "model.layers.69.self_attn.q_proj.weight": "pytorch_model-00105-of-00191.bin", + "model.layers.69.self_attn.v_proj.weight": "pytorch_model-00105-of-00191.bin", + "model.layers.7.input_layernorm.weight": "pytorch_model-00013-of-00191.bin", + "model.layers.7.mlp.down_proj.weight": "pytorch_model-00013-of-00191.bin", + "model.layers.7.mlp.gate_proj.weight": "pytorch_model-00012-of-00191.bin", + "model.layers.7.mlp.up_proj.weight": "pytorch_model-00013-of-00191.bin", + "model.layers.7.post_attention_layernorm.weight": "pytorch_model-00013-of-00191.bin", + "model.layers.7.self_attn.k_proj.weight": "pytorch_model-00012-of-00191.bin", + "model.layers.7.self_attn.o_proj.weight": "pytorch_model-00012-of-00191.bin", + "model.layers.7.self_attn.q_proj.weight": "pytorch_model-00012-of-00191.bin", + "model.layers.7.self_attn.v_proj.weight": "pytorch_model-00012-of-00191.bin", + "model.layers.70.input_layernorm.weight": "pytorch_model-00108-of-00191.bin", + "model.layers.70.mlp.down_proj.weight": "pytorch_model-00108-of-00191.bin", + "model.layers.70.mlp.gate_proj.weight": "pytorch_model-00107-of-00191.bin", + "model.layers.70.mlp.up_proj.weight": "pytorch_model-00107-of-00191.bin", + "model.layers.70.post_attention_layernorm.weight": "pytorch_model-00108-of-00191.bin", + "model.layers.70.self_attn.k_proj.weight": "pytorch_model-00106-of-00191.bin", + "model.layers.70.self_attn.o_proj.weight": "pytorch_model-00106-of-00191.bin", + "model.layers.70.self_attn.q_proj.weight": "pytorch_model-00106-of-00191.bin", + "model.layers.70.self_attn.v_proj.weight": "pytorch_model-00106-of-00191.bin", + "model.layers.71.input_layernorm.weight": "pytorch_model-00109-of-00191.bin", + "model.layers.71.mlp.down_proj.weight": "pytorch_model-00109-of-00191.bin", + "model.layers.71.mlp.gate_proj.weight": "pytorch_model-00108-of-00191.bin", + "model.layers.71.mlp.up_proj.weight": "pytorch_model-00109-of-00191.bin", + "model.layers.71.post_attention_layernorm.weight": "pytorch_model-00109-of-00191.bin", + "model.layers.71.self_attn.k_proj.weight": "pytorch_model-00108-of-00191.bin", + "model.layers.71.self_attn.o_proj.weight": "pytorch_model-00108-of-00191.bin", + "model.layers.71.self_attn.q_proj.weight": "pytorch_model-00108-of-00191.bin", + "model.layers.71.self_attn.v_proj.weight": "pytorch_model-00108-of-00191.bin", + "model.layers.72.input_layernorm.weight": "pytorch_model-00111-of-00191.bin", + "model.layers.72.mlp.down_proj.weight": "pytorch_model-00111-of-00191.bin", + "model.layers.72.mlp.gate_proj.weight": "pytorch_model-00110-of-00191.bin", + "model.layers.72.mlp.up_proj.weight": "pytorch_model-00110-of-00191.bin", + "model.layers.72.post_attention_layernorm.weight": "pytorch_model-00111-of-00191.bin", + "model.layers.72.self_attn.k_proj.weight": "pytorch_model-00109-of-00191.bin", + "model.layers.72.self_attn.o_proj.weight": "pytorch_model-00109-of-00191.bin", + "model.layers.72.self_attn.q_proj.weight": "pytorch_model-00109-of-00191.bin", + "model.layers.72.self_attn.v_proj.weight": "pytorch_model-00109-of-00191.bin", + "model.layers.73.input_layernorm.weight": "pytorch_model-00112-of-00191.bin", + "model.layers.73.mlp.down_proj.weight": "pytorch_model-00112-of-00191.bin", + "model.layers.73.mlp.gate_proj.weight": "pytorch_model-00111-of-00191.bin", + "model.layers.73.mlp.up_proj.weight": "pytorch_model-00112-of-00191.bin", + "model.layers.73.post_attention_layernorm.weight": "pytorch_model-00112-of-00191.bin", + "model.layers.73.self_attn.k_proj.weight": "pytorch_model-00111-of-00191.bin", + "model.layers.73.self_attn.o_proj.weight": "pytorch_model-00111-of-00191.bin", + "model.layers.73.self_attn.q_proj.weight": "pytorch_model-00111-of-00191.bin", + "model.layers.73.self_attn.v_proj.weight": "pytorch_model-00111-of-00191.bin", + "model.layers.74.input_layernorm.weight": "pytorch_model-00114-of-00191.bin", + "model.layers.74.mlp.down_proj.weight": "pytorch_model-00114-of-00191.bin", + "model.layers.74.mlp.gate_proj.weight": "pytorch_model-00113-of-00191.bin", + "model.layers.74.mlp.up_proj.weight": "pytorch_model-00113-of-00191.bin", + "model.layers.74.post_attention_layernorm.weight": "pytorch_model-00114-of-00191.bin", + "model.layers.74.self_attn.k_proj.weight": "pytorch_model-00112-of-00191.bin", + "model.layers.74.self_attn.o_proj.weight": "pytorch_model-00112-of-00191.bin", + "model.layers.74.self_attn.q_proj.weight": "pytorch_model-00112-of-00191.bin", + "model.layers.74.self_attn.v_proj.weight": "pytorch_model-00112-of-00191.bin", + "model.layers.75.input_layernorm.weight": "pytorch_model-00115-of-00191.bin", + "model.layers.75.mlp.down_proj.weight": "pytorch_model-00115-of-00191.bin", + "model.layers.75.mlp.gate_proj.weight": "pytorch_model-00114-of-00191.bin", + "model.layers.75.mlp.up_proj.weight": "pytorch_model-00115-of-00191.bin", + "model.layers.75.post_attention_layernorm.weight": "pytorch_model-00115-of-00191.bin", + "model.layers.75.self_attn.k_proj.weight": "pytorch_model-00114-of-00191.bin", + "model.layers.75.self_attn.o_proj.weight": "pytorch_model-00114-of-00191.bin", + "model.layers.75.self_attn.q_proj.weight": "pytorch_model-00114-of-00191.bin", + "model.layers.75.self_attn.v_proj.weight": "pytorch_model-00114-of-00191.bin", + "model.layers.76.input_layernorm.weight": "pytorch_model-00117-of-00191.bin", + "model.layers.76.mlp.down_proj.weight": "pytorch_model-00117-of-00191.bin", + "model.layers.76.mlp.gate_proj.weight": "pytorch_model-00116-of-00191.bin", + "model.layers.76.mlp.up_proj.weight": "pytorch_model-00116-of-00191.bin", + "model.layers.76.post_attention_layernorm.weight": "pytorch_model-00117-of-00191.bin", + "model.layers.76.self_attn.k_proj.weight": "pytorch_model-00115-of-00191.bin", + "model.layers.76.self_attn.o_proj.weight": "pytorch_model-00115-of-00191.bin", + "model.layers.76.self_attn.q_proj.weight": "pytorch_model-00115-of-00191.bin", + "model.layers.76.self_attn.v_proj.weight": "pytorch_model-00115-of-00191.bin", + "model.layers.77.input_layernorm.weight": "pytorch_model-00118-of-00191.bin", + "model.layers.77.mlp.down_proj.weight": "pytorch_model-00118-of-00191.bin", + "model.layers.77.mlp.gate_proj.weight": "pytorch_model-00117-of-00191.bin", + "model.layers.77.mlp.up_proj.weight": "pytorch_model-00118-of-00191.bin", + "model.layers.77.post_attention_layernorm.weight": "pytorch_model-00118-of-00191.bin", + "model.layers.77.self_attn.k_proj.weight": "pytorch_model-00117-of-00191.bin", + "model.layers.77.self_attn.o_proj.weight": "pytorch_model-00117-of-00191.bin", + "model.layers.77.self_attn.q_proj.weight": "pytorch_model-00117-of-00191.bin", + "model.layers.77.self_attn.v_proj.weight": "pytorch_model-00117-of-00191.bin", + "model.layers.78.input_layernorm.weight": "pytorch_model-00120-of-00191.bin", + "model.layers.78.mlp.down_proj.weight": "pytorch_model-00120-of-00191.bin", + "model.layers.78.mlp.gate_proj.weight": "pytorch_model-00119-of-00191.bin", + "model.layers.78.mlp.up_proj.weight": "pytorch_model-00119-of-00191.bin", + "model.layers.78.post_attention_layernorm.weight": "pytorch_model-00120-of-00191.bin", + "model.layers.78.self_attn.k_proj.weight": "pytorch_model-00118-of-00191.bin", + "model.layers.78.self_attn.o_proj.weight": "pytorch_model-00118-of-00191.bin", + "model.layers.78.self_attn.q_proj.weight": "pytorch_model-00118-of-00191.bin", + "model.layers.78.self_attn.v_proj.weight": "pytorch_model-00118-of-00191.bin", + "model.layers.79.input_layernorm.weight": "pytorch_model-00121-of-00191.bin", + "model.layers.79.mlp.down_proj.weight": "pytorch_model-00121-of-00191.bin", + "model.layers.79.mlp.gate_proj.weight": "pytorch_model-00120-of-00191.bin", + "model.layers.79.mlp.up_proj.weight": "pytorch_model-00121-of-00191.bin", + "model.layers.79.post_attention_layernorm.weight": "pytorch_model-00121-of-00191.bin", + "model.layers.79.self_attn.k_proj.weight": "pytorch_model-00120-of-00191.bin", + "model.layers.79.self_attn.o_proj.weight": "pytorch_model-00120-of-00191.bin", + "model.layers.79.self_attn.q_proj.weight": "pytorch_model-00120-of-00191.bin", + "model.layers.79.self_attn.v_proj.weight": "pytorch_model-00120-of-00191.bin", + "model.layers.8.input_layernorm.weight": "pytorch_model-00015-of-00191.bin", + "model.layers.8.mlp.down_proj.weight": "pytorch_model-00015-of-00191.bin", + "model.layers.8.mlp.gate_proj.weight": "pytorch_model-00014-of-00191.bin", + "model.layers.8.mlp.up_proj.weight": "pytorch_model-00014-of-00191.bin", + "model.layers.8.post_attention_layernorm.weight": "pytorch_model-00015-of-00191.bin", + "model.layers.8.self_attn.k_proj.weight": "pytorch_model-00013-of-00191.bin", + "model.layers.8.self_attn.o_proj.weight": "pytorch_model-00013-of-00191.bin", + "model.layers.8.self_attn.q_proj.weight": "pytorch_model-00013-of-00191.bin", + "model.layers.8.self_attn.v_proj.weight": "pytorch_model-00013-of-00191.bin", + "model.layers.80.input_layernorm.weight": "pytorch_model-00123-of-00191.bin", + "model.layers.80.mlp.down_proj.weight": "pytorch_model-00123-of-00191.bin", + "model.layers.80.mlp.gate_proj.weight": "pytorch_model-00122-of-00191.bin", + "model.layers.80.mlp.up_proj.weight": "pytorch_model-00122-of-00191.bin", + "model.layers.80.post_attention_layernorm.weight": "pytorch_model-00123-of-00191.bin", + "model.layers.80.self_attn.k_proj.weight": "pytorch_model-00121-of-00191.bin", + "model.layers.80.self_attn.o_proj.weight": "pytorch_model-00121-of-00191.bin", + "model.layers.80.self_attn.q_proj.weight": "pytorch_model-00121-of-00191.bin", + "model.layers.80.self_attn.v_proj.weight": "pytorch_model-00121-of-00191.bin", + "model.layers.81.input_layernorm.weight": "pytorch_model-00124-of-00191.bin", + "model.layers.81.mlp.down_proj.weight": "pytorch_model-00124-of-00191.bin", + "model.layers.81.mlp.gate_proj.weight": "pytorch_model-00123-of-00191.bin", + "model.layers.81.mlp.up_proj.weight": "pytorch_model-00124-of-00191.bin", + "model.layers.81.post_attention_layernorm.weight": "pytorch_model-00124-of-00191.bin", + "model.layers.81.self_attn.k_proj.weight": "pytorch_model-00123-of-00191.bin", + "model.layers.81.self_attn.o_proj.weight": "pytorch_model-00123-of-00191.bin", + "model.layers.81.self_attn.q_proj.weight": "pytorch_model-00123-of-00191.bin", + "model.layers.81.self_attn.v_proj.weight": "pytorch_model-00123-of-00191.bin", + "model.layers.82.input_layernorm.weight": "pytorch_model-00126-of-00191.bin", + "model.layers.82.mlp.down_proj.weight": "pytorch_model-00126-of-00191.bin", + "model.layers.82.mlp.gate_proj.weight": "pytorch_model-00125-of-00191.bin", + "model.layers.82.mlp.up_proj.weight": "pytorch_model-00125-of-00191.bin", + "model.layers.82.post_attention_layernorm.weight": "pytorch_model-00126-of-00191.bin", + "model.layers.82.self_attn.k_proj.weight": "pytorch_model-00124-of-00191.bin", + "model.layers.82.self_attn.o_proj.weight": "pytorch_model-00124-of-00191.bin", + "model.layers.82.self_attn.q_proj.weight": "pytorch_model-00124-of-00191.bin", + "model.layers.82.self_attn.v_proj.weight": "pytorch_model-00124-of-00191.bin", + "model.layers.83.input_layernorm.weight": "pytorch_model-00127-of-00191.bin", + "model.layers.83.mlp.down_proj.weight": "pytorch_model-00127-of-00191.bin", + "model.layers.83.mlp.gate_proj.weight": "pytorch_model-00126-of-00191.bin", + "model.layers.83.mlp.up_proj.weight": "pytorch_model-00127-of-00191.bin", + "model.layers.83.post_attention_layernorm.weight": "pytorch_model-00127-of-00191.bin", + "model.layers.83.self_attn.k_proj.weight": "pytorch_model-00126-of-00191.bin", + "model.layers.83.self_attn.o_proj.weight": "pytorch_model-00126-of-00191.bin", + "model.layers.83.self_attn.q_proj.weight": "pytorch_model-00126-of-00191.bin", + "model.layers.83.self_attn.v_proj.weight": "pytorch_model-00126-of-00191.bin", + "model.layers.84.input_layernorm.weight": "pytorch_model-00129-of-00191.bin", + "model.layers.84.mlp.down_proj.weight": "pytorch_model-00129-of-00191.bin", + "model.layers.84.mlp.gate_proj.weight": "pytorch_model-00128-of-00191.bin", + "model.layers.84.mlp.up_proj.weight": "pytorch_model-00128-of-00191.bin", + "model.layers.84.post_attention_layernorm.weight": "pytorch_model-00129-of-00191.bin", + "model.layers.84.self_attn.k_proj.weight": "pytorch_model-00127-of-00191.bin", + "model.layers.84.self_attn.o_proj.weight": "pytorch_model-00127-of-00191.bin", + "model.layers.84.self_attn.q_proj.weight": "pytorch_model-00127-of-00191.bin", + "model.layers.84.self_attn.v_proj.weight": "pytorch_model-00127-of-00191.bin", + "model.layers.85.input_layernorm.weight": "pytorch_model-00130-of-00191.bin", + "model.layers.85.mlp.down_proj.weight": "pytorch_model-00130-of-00191.bin", + "model.layers.85.mlp.gate_proj.weight": "pytorch_model-00129-of-00191.bin", + "model.layers.85.mlp.up_proj.weight": "pytorch_model-00130-of-00191.bin", + "model.layers.85.post_attention_layernorm.weight": "pytorch_model-00130-of-00191.bin", + "model.layers.85.self_attn.k_proj.weight": "pytorch_model-00129-of-00191.bin", + "model.layers.85.self_attn.o_proj.weight": "pytorch_model-00129-of-00191.bin", + "model.layers.85.self_attn.q_proj.weight": "pytorch_model-00129-of-00191.bin", + "model.layers.85.self_attn.v_proj.weight": "pytorch_model-00129-of-00191.bin", + "model.layers.86.input_layernorm.weight": "pytorch_model-00132-of-00191.bin", + "model.layers.86.mlp.down_proj.weight": "pytorch_model-00132-of-00191.bin", + "model.layers.86.mlp.gate_proj.weight": "pytorch_model-00131-of-00191.bin", + "model.layers.86.mlp.up_proj.weight": "pytorch_model-00131-of-00191.bin", + "model.layers.86.post_attention_layernorm.weight": "pytorch_model-00132-of-00191.bin", + "model.layers.86.self_attn.k_proj.weight": "pytorch_model-00130-of-00191.bin", + "model.layers.86.self_attn.o_proj.weight": "pytorch_model-00130-of-00191.bin", + "model.layers.86.self_attn.q_proj.weight": "pytorch_model-00130-of-00191.bin", + "model.layers.86.self_attn.v_proj.weight": "pytorch_model-00130-of-00191.bin", + "model.layers.87.input_layernorm.weight": "pytorch_model-00133-of-00191.bin", + "model.layers.87.mlp.down_proj.weight": "pytorch_model-00133-of-00191.bin", + "model.layers.87.mlp.gate_proj.weight": "pytorch_model-00132-of-00191.bin", + "model.layers.87.mlp.up_proj.weight": "pytorch_model-00133-of-00191.bin", + "model.layers.87.post_attention_layernorm.weight": "pytorch_model-00133-of-00191.bin", + "model.layers.87.self_attn.k_proj.weight": "pytorch_model-00132-of-00191.bin", + "model.layers.87.self_attn.o_proj.weight": "pytorch_model-00132-of-00191.bin", + "model.layers.87.self_attn.q_proj.weight": "pytorch_model-00132-of-00191.bin", + "model.layers.87.self_attn.v_proj.weight": "pytorch_model-00132-of-00191.bin", + "model.layers.88.input_layernorm.weight": "pytorch_model-00135-of-00191.bin", + "model.layers.88.mlp.down_proj.weight": "pytorch_model-00135-of-00191.bin", + "model.layers.88.mlp.gate_proj.weight": "pytorch_model-00134-of-00191.bin", + "model.layers.88.mlp.up_proj.weight": "pytorch_model-00134-of-00191.bin", + "model.layers.88.post_attention_layernorm.weight": "pytorch_model-00135-of-00191.bin", + "model.layers.88.self_attn.k_proj.weight": "pytorch_model-00133-of-00191.bin", + "model.layers.88.self_attn.o_proj.weight": "pytorch_model-00133-of-00191.bin", + "model.layers.88.self_attn.q_proj.weight": "pytorch_model-00133-of-00191.bin", + "model.layers.88.self_attn.v_proj.weight": "pytorch_model-00133-of-00191.bin", + "model.layers.89.input_layernorm.weight": "pytorch_model-00136-of-00191.bin", + "model.layers.89.mlp.down_proj.weight": "pytorch_model-00136-of-00191.bin", + "model.layers.89.mlp.gate_proj.weight": "pytorch_model-00135-of-00191.bin", + "model.layers.89.mlp.up_proj.weight": "pytorch_model-00136-of-00191.bin", + "model.layers.89.post_attention_layernorm.weight": "pytorch_model-00136-of-00191.bin", + "model.layers.89.self_attn.k_proj.weight": "pytorch_model-00135-of-00191.bin", + "model.layers.89.self_attn.o_proj.weight": "pytorch_model-00135-of-00191.bin", + "model.layers.89.self_attn.q_proj.weight": "pytorch_model-00135-of-00191.bin", + "model.layers.89.self_attn.v_proj.weight": "pytorch_model-00135-of-00191.bin", + "model.layers.9.input_layernorm.weight": "pytorch_model-00016-of-00191.bin", + "model.layers.9.mlp.down_proj.weight": "pytorch_model-00016-of-00191.bin", + "model.layers.9.mlp.gate_proj.weight": "pytorch_model-00015-of-00191.bin", + "model.layers.9.mlp.up_proj.weight": "pytorch_model-00016-of-00191.bin", + "model.layers.9.post_attention_layernorm.weight": "pytorch_model-00016-of-00191.bin", + "model.layers.9.self_attn.k_proj.weight": "pytorch_model-00015-of-00191.bin", + "model.layers.9.self_attn.o_proj.weight": "pytorch_model-00015-of-00191.bin", + "model.layers.9.self_attn.q_proj.weight": "pytorch_model-00015-of-00191.bin", + "model.layers.9.self_attn.v_proj.weight": "pytorch_model-00015-of-00191.bin", + "model.layers.90.input_layernorm.weight": "pytorch_model-00138-of-00191.bin", + "model.layers.90.mlp.down_proj.weight": "pytorch_model-00138-of-00191.bin", + "model.layers.90.mlp.gate_proj.weight": "pytorch_model-00137-of-00191.bin", + "model.layers.90.mlp.up_proj.weight": "pytorch_model-00137-of-00191.bin", + "model.layers.90.post_attention_layernorm.weight": "pytorch_model-00138-of-00191.bin", + "model.layers.90.self_attn.k_proj.weight": "pytorch_model-00136-of-00191.bin", + "model.layers.90.self_attn.o_proj.weight": "pytorch_model-00136-of-00191.bin", + "model.layers.90.self_attn.q_proj.weight": "pytorch_model-00136-of-00191.bin", + "model.layers.90.self_attn.v_proj.weight": "pytorch_model-00136-of-00191.bin", + "model.layers.91.input_layernorm.weight": "pytorch_model-00139-of-00191.bin", + "model.layers.91.mlp.down_proj.weight": "pytorch_model-00139-of-00191.bin", + "model.layers.91.mlp.gate_proj.weight": "pytorch_model-00138-of-00191.bin", + "model.layers.91.mlp.up_proj.weight": "pytorch_model-00139-of-00191.bin", + "model.layers.91.post_attention_layernorm.weight": "pytorch_model-00139-of-00191.bin", + "model.layers.91.self_attn.k_proj.weight": "pytorch_model-00138-of-00191.bin", + "model.layers.91.self_attn.o_proj.weight": "pytorch_model-00138-of-00191.bin", + "model.layers.91.self_attn.q_proj.weight": "pytorch_model-00138-of-00191.bin", + "model.layers.91.self_attn.v_proj.weight": "pytorch_model-00138-of-00191.bin", + "model.layers.92.input_layernorm.weight": "pytorch_model-00141-of-00191.bin", + "model.layers.92.mlp.down_proj.weight": "pytorch_model-00141-of-00191.bin", + "model.layers.92.mlp.gate_proj.weight": "pytorch_model-00140-of-00191.bin", + "model.layers.92.mlp.up_proj.weight": "pytorch_model-00140-of-00191.bin", + "model.layers.92.post_attention_layernorm.weight": "pytorch_model-00141-of-00191.bin", + "model.layers.92.self_attn.k_proj.weight": "pytorch_model-00139-of-00191.bin", + "model.layers.92.self_attn.o_proj.weight": "pytorch_model-00139-of-00191.bin", + "model.layers.92.self_attn.q_proj.weight": "pytorch_model-00139-of-00191.bin", + "model.layers.92.self_attn.v_proj.weight": "pytorch_model-00139-of-00191.bin", + "model.layers.93.input_layernorm.weight": "pytorch_model-00142-of-00191.bin", + "model.layers.93.mlp.down_proj.weight": "pytorch_model-00142-of-00191.bin", + "model.layers.93.mlp.gate_proj.weight": "pytorch_model-00141-of-00191.bin", + "model.layers.93.mlp.up_proj.weight": "pytorch_model-00142-of-00191.bin", + "model.layers.93.post_attention_layernorm.weight": "pytorch_model-00142-of-00191.bin", + "model.layers.93.self_attn.k_proj.weight": "pytorch_model-00141-of-00191.bin", + "model.layers.93.self_attn.o_proj.weight": "pytorch_model-00141-of-00191.bin", + "model.layers.93.self_attn.q_proj.weight": "pytorch_model-00141-of-00191.bin", + "model.layers.93.self_attn.v_proj.weight": "pytorch_model-00141-of-00191.bin", + "model.layers.94.input_layernorm.weight": "pytorch_model-00144-of-00191.bin", + "model.layers.94.mlp.down_proj.weight": "pytorch_model-00144-of-00191.bin", + "model.layers.94.mlp.gate_proj.weight": "pytorch_model-00143-of-00191.bin", + "model.layers.94.mlp.up_proj.weight": "pytorch_model-00143-of-00191.bin", + "model.layers.94.post_attention_layernorm.weight": "pytorch_model-00144-of-00191.bin", + "model.layers.94.self_attn.k_proj.weight": "pytorch_model-00142-of-00191.bin", + "model.layers.94.self_attn.o_proj.weight": "pytorch_model-00142-of-00191.bin", + "model.layers.94.self_attn.q_proj.weight": "pytorch_model-00142-of-00191.bin", + "model.layers.94.self_attn.v_proj.weight": "pytorch_model-00142-of-00191.bin", + "model.layers.95.input_layernorm.weight": "pytorch_model-00145-of-00191.bin", + "model.layers.95.mlp.down_proj.weight": "pytorch_model-00145-of-00191.bin", + "model.layers.95.mlp.gate_proj.weight": "pytorch_model-00144-of-00191.bin", + "model.layers.95.mlp.up_proj.weight": "pytorch_model-00145-of-00191.bin", + "model.layers.95.post_attention_layernorm.weight": "pytorch_model-00145-of-00191.bin", + "model.layers.95.self_attn.k_proj.weight": "pytorch_model-00144-of-00191.bin", + "model.layers.95.self_attn.o_proj.weight": "pytorch_model-00144-of-00191.bin", + "model.layers.95.self_attn.q_proj.weight": "pytorch_model-00144-of-00191.bin", + "model.layers.95.self_attn.v_proj.weight": "pytorch_model-00144-of-00191.bin", + "model.layers.96.input_layernorm.weight": "pytorch_model-00147-of-00191.bin", + "model.layers.96.mlp.down_proj.weight": "pytorch_model-00147-of-00191.bin", + "model.layers.96.mlp.gate_proj.weight": "pytorch_model-00146-of-00191.bin", + "model.layers.96.mlp.up_proj.weight": "pytorch_model-00146-of-00191.bin", + "model.layers.96.post_attention_layernorm.weight": "pytorch_model-00147-of-00191.bin", + "model.layers.96.self_attn.k_proj.weight": "pytorch_model-00145-of-00191.bin", + "model.layers.96.self_attn.o_proj.weight": "pytorch_model-00145-of-00191.bin", + "model.layers.96.self_attn.q_proj.weight": "pytorch_model-00145-of-00191.bin", + "model.layers.96.self_attn.v_proj.weight": "pytorch_model-00145-of-00191.bin", + "model.layers.97.input_layernorm.weight": "pytorch_model-00148-of-00191.bin", + "model.layers.97.mlp.down_proj.weight": "pytorch_model-00148-of-00191.bin", + "model.layers.97.mlp.gate_proj.weight": "pytorch_model-00147-of-00191.bin", + "model.layers.97.mlp.up_proj.weight": "pytorch_model-00148-of-00191.bin", + "model.layers.97.post_attention_layernorm.weight": "pytorch_model-00148-of-00191.bin", + "model.layers.97.self_attn.k_proj.weight": "pytorch_model-00147-of-00191.bin", + "model.layers.97.self_attn.o_proj.weight": "pytorch_model-00147-of-00191.bin", + "model.layers.97.self_attn.q_proj.weight": "pytorch_model-00147-of-00191.bin", + "model.layers.97.self_attn.v_proj.weight": "pytorch_model-00147-of-00191.bin", + "model.layers.98.input_layernorm.weight": "pytorch_model-00150-of-00191.bin", + "model.layers.98.mlp.down_proj.weight": "pytorch_model-00150-of-00191.bin", + "model.layers.98.mlp.gate_proj.weight": "pytorch_model-00149-of-00191.bin", + "model.layers.98.mlp.up_proj.weight": "pytorch_model-00149-of-00191.bin", + "model.layers.98.post_attention_layernorm.weight": "pytorch_model-00150-of-00191.bin", + "model.layers.98.self_attn.k_proj.weight": "pytorch_model-00148-of-00191.bin", + "model.layers.98.self_attn.o_proj.weight": "pytorch_model-00148-of-00191.bin", + "model.layers.98.self_attn.q_proj.weight": "pytorch_model-00148-of-00191.bin", + "model.layers.98.self_attn.v_proj.weight": "pytorch_model-00148-of-00191.bin", + "model.layers.99.input_layernorm.weight": "pytorch_model-00151-of-00191.bin", + "model.layers.99.mlp.down_proj.weight": "pytorch_model-00151-of-00191.bin", + "model.layers.99.mlp.gate_proj.weight": "pytorch_model-00150-of-00191.bin", + "model.layers.99.mlp.up_proj.weight": "pytorch_model-00151-of-00191.bin", + "model.layers.99.post_attention_layernorm.weight": "pytorch_model-00151-of-00191.bin", + "model.layers.99.self_attn.k_proj.weight": "pytorch_model-00150-of-00191.bin", + "model.layers.99.self_attn.o_proj.weight": "pytorch_model-00150-of-00191.bin", + "model.layers.99.self_attn.q_proj.weight": "pytorch_model-00150-of-00191.bin", + "model.layers.99.self_attn.v_proj.weight": "pytorch_model-00150-of-00191.bin", + "model.norm.weight": "pytorch_model-00190-of-00191.bin" + } +} diff --git a/special_tokens_map.json b/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..89af31a3c96c39011ffec99c32a770062be9dc7c --- /dev/null +++ b/special_tokens_map.json @@ -0,0 +1,23 @@ +{ + "bos_token": { + "content": "<|begin_of_text|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + }, + "eos_token": { + "content": "<|end_of_text|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + }, + "pad_token": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + } +} diff --git a/tokenizer.json b/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..548e7b196b97b38c45068d7a2bcedfbb444546cd --- /dev/null +++ b/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9400df98529060210393c40f08cb127f7c0df584338b3fbfdba8cf82a33c1ade +size 17210102 diff --git a/tokenizer_config.json b/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..ef8218534a4cd20717275b6ae849b35d4821ba1d --- /dev/null +++ b/tokenizer_config.json @@ -0,0 +1,2072 @@ +{ + "added_tokens_decoder": { + "128000": { + "content": "<|begin_of_text|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128001": { + "content": "<|end_of_text|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128002": { + "content": "<|reserved_special_token_0|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128003": { + "content": "<|reserved_special_token_1|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128004": { + "content": "<|finetune_right_pad_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128005": { + "content": "<|reserved_special_token_2|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128006": { + "content": "<|start_header_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128007": { + "content": "<|end_header_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128008": { + "content": "<|eom_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128009": { + "content": "<|eot_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128010": { + "content": "<|python_tag|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128011": { + "content": "<|reserved_special_token_3|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128012": { + "content": "<|reserved_special_token_4|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128013": { + "content": "<|reserved_special_token_5|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128014": { + "content": "<|reserved_special_token_6|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128015": { + "content": "<|reserved_special_token_7|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128016": { + "content": "<|reserved_special_token_8|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128017": { + "content": "<|reserved_special_token_9|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128018": { + "content": "<|reserved_special_token_10|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128019": { + "content": "<|reserved_special_token_11|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128020": { + "content": "<|reserved_special_token_12|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128021": { + "content": "<|reserved_special_token_13|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128022": { + "content": "<|reserved_special_token_14|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128023": { + "content": "<|reserved_special_token_15|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128024": { + "content": "<|reserved_special_token_16|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128025": { + "content": "<|reserved_special_token_17|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128026": { + "content": "<|reserved_special_token_18|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128027": { + "content": "<|reserved_special_token_19|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128028": { + "content": "<|reserved_special_token_20|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128029": { + "content": "<|reserved_special_token_21|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128030": { + "content": "<|reserved_special_token_22|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128031": { + "content": "<|reserved_special_token_23|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128032": { + "content": "<|reserved_special_token_24|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128033": { + "content": "<|reserved_special_token_25|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128034": { + "content": "<|reserved_special_token_26|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128035": { + "content": "<|reserved_special_token_27|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128036": { + "content": "<|reserved_special_token_28|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128037": { + "content": "<|reserved_special_token_29|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128038": { + "content": "<|reserved_special_token_30|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128039": { + "content": "<|reserved_special_token_31|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128040": { + "content": "<|reserved_special_token_32|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128041": { + "content": "<|reserved_special_token_33|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128042": { + "content": "<|reserved_special_token_34|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128043": { + "content": "<|reserved_special_token_35|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128044": { + "content": "<|reserved_special_token_36|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128045": { + "content": "<|reserved_special_token_37|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128046": { + "content": "<|reserved_special_token_38|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128047": { + "content": "<|reserved_special_token_39|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128048": { + "content": "<|reserved_special_token_40|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128049": { + "content": "<|reserved_special_token_41|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128050": { + "content": "<|reserved_special_token_42|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128051": { + "content": "<|reserved_special_token_43|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128052": { + "content": "<|reserved_special_token_44|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128053": { + "content": "<|reserved_special_token_45|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128054": { + "content": "<|reserved_special_token_46|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128055": { + "content": "<|reserved_special_token_47|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128056": { + "content": "<|reserved_special_token_48|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128057": { + "content": "<|reserved_special_token_49|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128058": { + "content": "<|reserved_special_token_50|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128059": { + "content": "<|reserved_special_token_51|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128060": { + "content": "<|reserved_special_token_52|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128061": { + "content": "<|reserved_special_token_53|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128062": { + "content": "<|reserved_special_token_54|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128063": { + "content": "<|reserved_special_token_55|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128064": { + "content": "<|reserved_special_token_56|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128065": { + "content": "<|reserved_special_token_57|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128066": { + "content": "<|reserved_special_token_58|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128067": { + "content": "<|reserved_special_token_59|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128068": { + "content": "<|reserved_special_token_60|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128069": { + "content": "<|reserved_special_token_61|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128070": { + "content": "<|reserved_special_token_62|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128071": { + "content": "<|reserved_special_token_63|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128072": { + "content": "<|reserved_special_token_64|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128073": { + "content": "<|reserved_special_token_65|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128074": { + "content": "<|reserved_special_token_66|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128075": { + "content": "<|reserved_special_token_67|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128076": { + "content": "<|reserved_special_token_68|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128077": { + "content": "<|reserved_special_token_69|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128078": { + "content": "<|reserved_special_token_70|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128079": { + "content": "<|reserved_special_token_71|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128080": { + "content": "<|reserved_special_token_72|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128081": { + "content": "<|reserved_special_token_73|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128082": { + "content": "<|reserved_special_token_74|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128083": { + "content": "<|reserved_special_token_75|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128084": { + "content": "<|reserved_special_token_76|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128085": { + "content": "<|reserved_special_token_77|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128086": { + "content": "<|reserved_special_token_78|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128087": { + "content": "<|reserved_special_token_79|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128088": { + "content": "<|reserved_special_token_80|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128089": { + "content": "<|reserved_special_token_81|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128090": { + "content": "<|reserved_special_token_82|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128091": { + "content": "<|reserved_special_token_83|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128092": { + "content": "<|reserved_special_token_84|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128093": { + "content": "<|reserved_special_token_85|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128094": { + "content": "<|reserved_special_token_86|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128095": { + "content": "<|reserved_special_token_87|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128096": { + "content": "<|reserved_special_token_88|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128097": { + "content": "<|reserved_special_token_89|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128098": { + "content": "<|reserved_special_token_90|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128099": { + "content": "<|reserved_special_token_91|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128100": { + "content": "<|reserved_special_token_92|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128101": { + "content": "<|reserved_special_token_93|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128102": { + "content": "<|reserved_special_token_94|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128103": { + "content": "<|reserved_special_token_95|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128104": { + "content": "<|reserved_special_token_96|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128105": { + "content": "<|reserved_special_token_97|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128106": { + "content": "<|reserved_special_token_98|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128107": { + "content": "<|reserved_special_token_99|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128108": { + "content": "<|reserved_special_token_100|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128109": { + "content": "<|reserved_special_token_101|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128110": { + "content": "<|reserved_special_token_102|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128111": { + "content": "<|reserved_special_token_103|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128112": { + "content": "<|reserved_special_token_104|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128113": { + "content": "<|reserved_special_token_105|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128114": { + "content": "<|reserved_special_token_106|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128115": { + "content": "<|reserved_special_token_107|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128116": { + "content": "<|reserved_special_token_108|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128117": { + "content": "<|reserved_special_token_109|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128118": { + "content": "<|reserved_special_token_110|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128119": { + "content": "<|reserved_special_token_111|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128120": { + "content": "<|reserved_special_token_112|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128121": { + "content": "<|reserved_special_token_113|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128122": { + "content": "<|reserved_special_token_114|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128123": { + "content": "<|reserved_special_token_115|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128124": { + "content": "<|reserved_special_token_116|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128125": { + "content": "<|reserved_special_token_117|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128126": { + "content": "<|reserved_special_token_118|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128127": { + "content": "<|reserved_special_token_119|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128128": { + "content": "<|reserved_special_token_120|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128129": { + "content": "<|reserved_special_token_121|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128130": { + "content": "<|reserved_special_token_122|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128131": { + "content": "<|reserved_special_token_123|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128132": { + "content": "<|reserved_special_token_124|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128133": { + "content": "<|reserved_special_token_125|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128134": { + "content": "<|reserved_special_token_126|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128135": { + "content": "<|reserved_special_token_127|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128136": { + "content": "<|reserved_special_token_128|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128137": { + "content": "<|reserved_special_token_129|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128138": { + "content": "<|reserved_special_token_130|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128139": { + "content": "<|reserved_special_token_131|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128140": { + "content": "<|reserved_special_token_132|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128141": { + "content": "<|reserved_special_token_133|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128142": { + "content": "<|reserved_special_token_134|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128143": { + "content": "<|reserved_special_token_135|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128144": { + "content": "<|reserved_special_token_136|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128145": { + "content": "<|reserved_special_token_137|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128146": { + "content": "<|reserved_special_token_138|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128147": { + "content": "<|reserved_special_token_139|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128148": { + "content": "<|reserved_special_token_140|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128149": { + "content": "<|reserved_special_token_141|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128150": { + "content": "<|reserved_special_token_142|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128151": { + "content": "<|reserved_special_token_143|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128152": { + "content": "<|reserved_special_token_144|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128153": { + "content": "<|reserved_special_token_145|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128154": { + "content": "<|reserved_special_token_146|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128155": { + "content": "<|reserved_special_token_147|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128156": { + "content": "<|reserved_special_token_148|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128157": { + "content": "<|reserved_special_token_149|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128158": { + "content": "<|reserved_special_token_150|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128159": { + "content": "<|reserved_special_token_151|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128160": { + "content": "<|reserved_special_token_152|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128161": { + "content": "<|reserved_special_token_153|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128162": { + "content": "<|reserved_special_token_154|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128163": { + "content": "<|reserved_special_token_155|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128164": { + "content": "<|reserved_special_token_156|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128165": { + "content": "<|reserved_special_token_157|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128166": { + "content": "<|reserved_special_token_158|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128167": { + "content": "<|reserved_special_token_159|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128168": { + "content": "<|reserved_special_token_160|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128169": { + "content": "<|reserved_special_token_161|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128170": { + "content": "<|reserved_special_token_162|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128171": { + "content": "<|reserved_special_token_163|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128172": { + "content": "<|reserved_special_token_164|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128173": { + "content": "<|reserved_special_token_165|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128174": { + "content": "<|reserved_special_token_166|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128175": { + "content": "<|reserved_special_token_167|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128176": { + "content": "<|reserved_special_token_168|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128177": { + "content": "<|reserved_special_token_169|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128178": { + "content": "<|reserved_special_token_170|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128179": { + "content": "<|reserved_special_token_171|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128180": { + "content": "<|reserved_special_token_172|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128181": { + "content": "<|reserved_special_token_173|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128182": { + "content": "<|reserved_special_token_174|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128183": { + "content": "<|reserved_special_token_175|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128184": { + "content": "<|reserved_special_token_176|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128185": { + "content": "<|reserved_special_token_177|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128186": { + "content": "<|reserved_special_token_178|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128187": { + "content": "<|reserved_special_token_179|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128188": { + "content": "<|reserved_special_token_180|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128189": { + "content": "<|reserved_special_token_181|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128190": { + "content": "<|reserved_special_token_182|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128191": { + "content": "<|reserved_special_token_183|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128192": { + "content": "<|reserved_special_token_184|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128193": { + "content": "<|reserved_special_token_185|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128194": { + "content": "<|reserved_special_token_186|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128195": { + "content": "<|reserved_special_token_187|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128196": { + "content": "<|reserved_special_token_188|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128197": { + "content": "<|reserved_special_token_189|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128198": { + "content": "<|reserved_special_token_190|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128199": { + "content": "<|reserved_special_token_191|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128200": { + "content": "<|reserved_special_token_192|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128201": { + "content": "<|reserved_special_token_193|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128202": { + "content": "<|reserved_special_token_194|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128203": { + "content": "<|reserved_special_token_195|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128204": { + "content": "<|reserved_special_token_196|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128205": { + "content": "<|reserved_special_token_197|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128206": { + "content": "<|reserved_special_token_198|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128207": { + "content": "<|reserved_special_token_199|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128208": { + "content": "<|reserved_special_token_200|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128209": { + "content": "<|reserved_special_token_201|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128210": { + "content": "<|reserved_special_token_202|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128211": { + "content": "<|reserved_special_token_203|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128212": { + "content": "<|reserved_special_token_204|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128213": { + "content": "<|reserved_special_token_205|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128214": { + "content": "<|reserved_special_token_206|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128215": { + "content": "<|reserved_special_token_207|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128216": { + "content": "<|reserved_special_token_208|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128217": { + "content": "<|reserved_special_token_209|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128218": { + "content": "<|reserved_special_token_210|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128219": { + "content": "<|reserved_special_token_211|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128220": { + "content": "<|reserved_special_token_212|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128221": { + "content": "<|reserved_special_token_213|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128222": { + "content": "<|reserved_special_token_214|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128223": { + "content": "<|reserved_special_token_215|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128224": { + "content": "<|reserved_special_token_216|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128225": { + "content": "<|reserved_special_token_217|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128226": { + "content": "<|reserved_special_token_218|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128227": { + "content": "<|reserved_special_token_219|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128228": { + "content": "<|reserved_special_token_220|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128229": { + "content": "<|reserved_special_token_221|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128230": { + "content": "<|reserved_special_token_222|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128231": { + "content": "<|reserved_special_token_223|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128232": { + "content": "<|reserved_special_token_224|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128233": { + "content": "<|reserved_special_token_225|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128234": { + "content": "<|reserved_special_token_226|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128235": { + "content": "<|reserved_special_token_227|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128236": { + "content": "<|reserved_special_token_228|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128237": { + "content": "<|reserved_special_token_229|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128238": { + "content": "<|reserved_special_token_230|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128239": { + "content": "<|reserved_special_token_231|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128240": { + "content": "<|reserved_special_token_232|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128241": { + "content": "<|reserved_special_token_233|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128242": { + "content": "<|reserved_special_token_234|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128243": { + "content": "<|reserved_special_token_235|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128244": { + "content": "<|reserved_special_token_236|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128245": { + "content": "<|reserved_special_token_237|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128246": { + "content": "<|reserved_special_token_238|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128247": { + "content": "<|reserved_special_token_239|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128248": { + "content": "<|reserved_special_token_240|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128249": { + "content": "<|reserved_special_token_241|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128250": { + "content": "<|reserved_special_token_242|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128251": { + "content": "<|reserved_special_token_243|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128252": { + "content": "<|reserved_special_token_244|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128253": { + "content": "<|reserved_special_token_245|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128254": { + "content": "<|reserved_special_token_246|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128255": { + "content": "<|reserved_special_token_247|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128256": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + } + }, + "bos_token": "<|begin_of_text|>", + "chat_template": "{% for message in messages %}{% if message['role'] == 'system' %}{{ '<|system|>\n' + message['content'] + '\n' }}{% elif message['role'] == 'user' %}{{ '<|user|>\n' + message['content'] + '\n' }}{% elif message['role'] == 'assistant' %}{% if not loop.last %}{{ '<|assistant|>\n' + message['content'] + eos_token + '\n' }}{% else %}{{ '<|assistant|>\n' + message['content'] + eos_token }}{% endif %}{% endif %}{% if loop.last and add_generation_prompt %}{{ '<|assistant|>\n' }}{% endif %}{% endfor %}", + "clean_up_tokenization_spaces": true, + "eos_token": "<|end_of_text|>", + "extra_special_tokens": {}, + "model_input_names": [ + "input_ids", + "attention_mask" + ], + "model_max_length": 131072, + "pad_token": "", + "tokenizer_class": "PreTrainedTokenizerFast" +}