diff --git "a/ndarray-cache.json" "b/ndarray-cache.json" --- "a/ndarray-cache.json" +++ "b/ndarray-cache.json" @@ -1,8 +1,8 @@ { "metadata": { - "ParamSize": 869, - "ParamBytes": 1873364948.0, - "BitsPerParam": 3.7021917590823534 + "ParamSize": 724, + "ParamBytes": 2340679936.0, + "BitsPerParam": 4.625711599312261 }, "records": [ { @@ -22,7 +22,7 @@ "byteOffset": 0 } ], - "md5sum": "8a35ddbbc2ab05256c6c2d54d6094fda" + "md5sum": "d7e1c53f4ed3388ab3651a4ac7fe5c3b" }, { "dataPath": "params_shard_1.bin", @@ -41,7 +41,7 @@ "byteOffset": 0 } ], - "md5sum": "5e643ec4c20f60ffaeae2a841566cd75" + "md5sum": "bbe371e4c6556993e74003d072d5a519" }, { "dataPath": "params_shard_2.bin", @@ -145,7 +145,7 @@ "byteOffset": 31582336 } ], - "md5sum": "24fab578168aeadbc9559a578c7183e7" + "md5sum": "8eb6f7a52bf759728f53f0245c72a859" }, { "dataPath": "params_shard_3.bin", @@ -186,7 +186,7 @@ "byteOffset": 11335680 } ], - "md5sum": "419b98c8f9ad7d166c3979d8d9c7559b" + "md5sum": "2ba63895330a62bc1318c87c5d5072ce" }, { "dataPath": "params_shard_4.bin", @@ -205,7 +205,7 @@ "byteOffset": 0 } ], - "md5sum": "1664118860d52dd98f030f503f04ad24" + "md5sum": "9456eef90ffdc61e81ffe0800109e762" }, { "dataPath": "params_shard_5.bin", @@ -331,7 +331,7 @@ "byteOffset": 33425408 } ], - "md5sum": "c2a46d96f42d25691193feaf4dfdb7f2" + "md5sum": "cd6b9aa2b41c2140645eefb808a8a2e3" }, { "dataPath": "params_shard_6.bin", @@ -350,7 +350,7 @@ "byteOffset": 0 } ], - "md5sum": "5a0644c2a7b96ecc7f44db61c76980b1" + "md5sum": "4ec6c96f6227fce6dbe6a251dad201f3" }, { "dataPath": "params_shard_7.bin", @@ -455,7 +455,7 @@ "byteOffset": 30896128 } ], - "md5sum": "e207ed95b32cf79cd2023cf0ec11d8c7" + "md5sum": "30f769a15fbdac43ca45e6812ffecbfb" }, { "dataPath": "params_shard_8.bin", @@ -474,7 +474,7 @@ "byteOffset": 0 } ], - "md5sum": "f4302a88dfb0c1dd8f39023f158eecb1" + "md5sum": "3e20b5efdce2e340dbb820d88b3cb7e0" }, { "dataPath": "params_shard_9.bin", @@ -579,7 +579,7 @@ "byteOffset": 30896128 } ], - "md5sum": "526c77bf2a28ad9f696f99d2f36324b5" + "md5sum": "5bbad59fbf3fd94682eb75a071e0f264" }, { "dataPath": "params_shard_10.bin", @@ -598,7 +598,7 @@ "byteOffset": 0 } ], - "md5sum": "7d502dc51f0b4ba087038840e2e3fa2a" + "md5sum": "5c710bda058fe56ce812112e1b0f0ee0" }, { "dataPath": "params_shard_11.bin", @@ -703,7 +703,7 @@ "byteOffset": 30896128 } ], - "md5sum": "40b08c6e4a04c85dcc8d20763a131aaa" + "md5sum": "7a15e2962ed42b63453eaecd837ff275" }, { "dataPath": "params_shard_12.bin", @@ -722,7 +722,7 @@ "byteOffset": 0 } ], - "md5sum": "ad0c16081945fd54ca9d5bf88322cf6e" + "md5sum": "0a10e859199899afd04e346c84ef3eef" }, { "dataPath": "params_shard_13.bin", @@ -827,7 +827,7 @@ "byteOffset": 30896128 } ], - "md5sum": "ff97580cc8b519c9a0dafbec95ce9076" + "md5sum": "6bc76013f6066d9569517976841883eb" }, { "dataPath": "params_shard_14.bin", @@ -846,7 +846,7 @@ "byteOffset": 0 } ], - "md5sum": "900c18766113eff094153343f44eae68" + "md5sum": "f734322260c53272938e682d4441e076" }, { "dataPath": "params_shard_15.bin", @@ -951,7 +951,7 @@ "byteOffset": 30896128 } ], - "md5sum": "354d4710d313309d24b60d9dc0d7de86" + "md5sum": "ad714acba2104718fb5491a432b197d1" }, { "dataPath": "params_shard_16.bin", @@ -970,7 +970,7 @@ "byteOffset": 0 } ], - "md5sum": "375e40a711c06214bcf155207c27c8df" + "md5sum": "348d7841fb570d2dc49bbb93d3679134" }, { "dataPath": "params_shard_17.bin", @@ -1075,7 +1075,7 @@ "byteOffset": 30896128 } ], - "md5sum": "2a08f7bdb8837cf2659d8d2d62b47cfb" + "md5sum": "6179ab639c1bda89b3c90cb50ae11762" }, { "dataPath": "params_shard_18.bin", @@ -1094,7 +1094,7 @@ "byteOffset": 0 } ], - "md5sum": "02e503ff2aa0900aa47e73d0b85ef80d" + "md5sum": "336989816dd64c49e7eadbdea61ca170" }, { "dataPath": "params_shard_19.bin", @@ -1199,7 +1199,7 @@ "byteOffset": 30896128 } ], - "md5sum": "089a8975a68756edba36ba294c67a8ef" + "md5sum": "da3b6c34fb6d830d6245f9c61818a068" }, { "dataPath": "params_shard_20.bin", @@ -1218,7 +1218,7 @@ "byteOffset": 0 } ], - "md5sum": "e55ee3c00cc9b2fc5db22c815ed1e35f" + "md5sum": "0640e92aa128f4e05a58d7c5cc356006" }, { "dataPath": "params_shard_21.bin", @@ -1323,7 +1323,7 @@ "byteOffset": 30896128 } ], - "md5sum": "f3478b8fbcd86f16cec0803918d5e3ec" + "md5sum": "db3317dfde5ff5e937017d05543c3792" }, { "dataPath": "params_shard_22.bin", @@ -1342,7 +1342,7 @@ "byteOffset": 0 } ], - "md5sum": "2d47274575a56cc29842d9f9413d801c" + "md5sum": "0e9f6c20144e7d9da545ac535987d49c" }, { "dataPath": "params_shard_23.bin", @@ -1447,7 +1447,7 @@ "byteOffset": 30896128 } ], - "md5sum": "6871519612a4b73c0d24e2b32bcfb785" + "md5sum": "5cd3f1298c7d3e2eba61c2dccaa51fa1" }, { "dataPath": "params_shard_24.bin", @@ -1466,7 +1466,7 @@ "byteOffset": 0 } ], - "md5sum": "b90a3c96a5a1207a3574ae02a48669ef" + "md5sum": "1d625599633f2e8fdd20ea38072c1a3a" }, { "dataPath": "params_shard_25.bin", @@ -1571,7 +1571,7 @@ "byteOffset": 30896128 } ], - "md5sum": "bd8f516641f37b8ab8fdfbf5341150d7" + "md5sum": "430a7c4d1d69396f3ec1eb880b7f716f" }, { "dataPath": "params_shard_26.bin", @@ -1590,7 +1590,7 @@ "byteOffset": 0 } ], - "md5sum": "5cad5fb8c628578200af5174a42c330d" + "md5sum": "25077b71bded2893f97467c767447e8f" }, { "dataPath": "params_shard_27.bin", @@ -1695,7 +1695,7 @@ "byteOffset": 30896128 } ], - "md5sum": "3aabdc1f95147e394d5de5df9697ef2b" + "md5sum": "2239b285a54e01bb80bccbf22c562d3f" }, { "dataPath": "params_shard_28.bin", @@ -1714,7 +1714,7 @@ "byteOffset": 0 } ], - "md5sum": "381023fb23574049257f2a0eec9b554f" + "md5sum": "5e7537fcb657900a598019c4ea92dc0a" }, { "dataPath": "params_shard_29.bin", @@ -1733,7 +1733,7 @@ "byteOffset": 0 } ], - "md5sum": "b05a8053cb19739cf76c4d5e303b95ed" + "md5sum": "8409accc0efa14b9bd2212b965b6d449" }, { "dataPath": "params_shard_30.bin", @@ -1838,7 +1838,7 @@ "byteOffset": 32057472 } ], - "md5sum": "55427a0d100d982af219140f2f1b3b19" + "md5sum": "897b4fd728d5eaf06f7e5e8eb9fff479" }, { "dataPath": "params_shard_31.bin", @@ -1857,7 +1857,7 @@ "byteOffset": 0 } ], - "md5sum": "655b2041eb3bc532b2f76f8a3044a80e" + "md5sum": "d3bc8dfb66a961ed8ff8d82d62f891e6" }, { "dataPath": "params_shard_32.bin", @@ -1983,7 +1983,7 @@ "byteOffset": 33425408 } ], - "md5sum": "60597c76e7ae98d8687f3ef6d24ef84d" + "md5sum": "9fa4180ca7f3d8d2671e424df58f7d33" }, { "dataPath": "params_shard_33.bin", @@ -2002,7 +2002,7 @@ "byteOffset": 0 } ], - "md5sum": "3beb4e5859d4d77a395a9cfcda94fd21" + "md5sum": "a3f57885456413befe772a61db9fe003" }, { "dataPath": "params_shard_34.bin", @@ -2107,7 +2107,7 @@ "byteOffset": 30896128 } ], - "md5sum": "a5a2e49eb5e992f4a4da8593a0e32c46" + "md5sum": "939e4d0a910d890d33ab3aa4cfae6527" }, { "dataPath": "params_shard_35.bin", @@ -2126,7 +2126,7 @@ "byteOffset": 0 } ], - "md5sum": "a5ee83fb741c7a33c7e86784d9be28d6" + "md5sum": "ba8cc1009d70aa580a3c3464ddcf2e1b" }, { "dataPath": "params_shard_36.bin", @@ -2231,7 +2231,7 @@ "byteOffset": 30896128 } ], - "md5sum": "8b09bdf75eba6d273336c78223a3fbac" + "md5sum": "cf73ece61d143b5685eef41c20229c42" }, { "dataPath": "params_shard_37.bin", @@ -2250,7 +2250,7 @@ "byteOffset": 0 } ], - "md5sum": "a3b6820d889f86491595e7c64a292346" + "md5sum": "62f2abbb1faa52d0bce9d55753794a88" }, { "dataPath": "params_shard_38.bin", @@ -2355,7 +2355,7 @@ "byteOffset": 30896128 } ], - "md5sum": "2cf21a5ab798e9a8424ba6c8d4475414" + "md5sum": "d2acdc47a3bc43aa505032d2bb8c15f3" }, { "dataPath": "params_shard_39.bin", @@ -2374,7 +2374,7 @@ "byteOffset": 0 } ], - "md5sum": "f4ab43131aa9a0ffee3815b901dc8591" + "md5sum": "bb5529cdb10895082d3b2e5293f6d1cd" }, { "dataPath": "params_shard_40.bin", @@ -2479,7 +2479,7 @@ "byteOffset": 30896128 } ], - "md5sum": "c0cb92677fedc090b87887989db52c5b" + "md5sum": "98ef5b4e63d4701a25201cdc3c05bf12" }, { "dataPath": "params_shard_41.bin", @@ -2498,7 +2498,7 @@ "byteOffset": 0 } ], - "md5sum": "0756b15ae5e75580f8a9f33f62914dda" + "md5sum": "24522563518632d9a17f4166066cb200" }, { "dataPath": "params_shard_42.bin", @@ -2603,7 +2603,7 @@ "byteOffset": 30896128 } ], - "md5sum": "f7ec2b75978886fca92ba13a6a511bf0" + "md5sum": "8d3fab7847a5c022d510e83f15c23ad7" }, { "dataPath": "params_shard_43.bin", @@ -2622,7 +2622,7 @@ "byteOffset": 0 } ], - "md5sum": "67c0eba6afa7bead6674cbc479f6b5a7" + "md5sum": "215dc6ff0a1f211c3727dcc991c46cf1" }, { "dataPath": "params_shard_44.bin", @@ -2727,7 +2727,7 @@ "byteOffset": 30896128 } ], - "md5sum": "f67124710df92edb87263cc95ca70806" + "md5sum": "72866c136adefde27ba78274ed57619a" }, { "dataPath": "params_shard_45.bin", @@ -2746,7 +2746,7 @@ "byteOffset": 0 } ], - "md5sum": "db05762038bee40f53680fbf656b91da" + "md5sum": "7f02d5ccf7cc2c4370777d6ae00b1244" }, { "dataPath": "params_shard_46.bin", @@ -2851,7 +2851,7 @@ "byteOffset": 30896128 } ], - "md5sum": "939795fea6dc100035f9fc0a49d711b0" + "md5sum": "30abcca65e41086ad0667aacaf53384b" }, { "dataPath": "params_shard_47.bin", @@ -2870,7 +2870,7 @@ "byteOffset": 0 } ], - "md5sum": "f9fb91d66e9fca6030f1ae038d840f00" + "md5sum": "69a2467ff910a2811ef2c4542bc4fe56" }, { "dataPath": "params_shard_48.bin", @@ -2975,7 +2975,7 @@ "byteOffset": 30896128 } ], - "md5sum": "8ab8d33f317b9a6c5c60140793ff0fd3" + "md5sum": "a22c8fb5e9fed8eeee2e25e97eebabaa" }, { "dataPath": "params_shard_49.bin", @@ -2994,7 +2994,7 @@ "byteOffset": 0 } ], - "md5sum": "d02c9a6a3e469a42b7727dcbe8da5372" + "md5sum": "de1a4314be8c30ee24e9f222493b0f5b" }, { "dataPath": "params_shard_50.bin", @@ -3100,7 +3100,7 @@ "byteOffset": 31371264 } ], - "md5sum": "34bb78bf6f0142eae8fc499be2eae4a1" + "md5sum": "e236c8247a12c058d052abe0ae7fc877" }, { "dataPath": "params_shard_51.bin", @@ -3119,7 +3119,7 @@ "byteOffset": 0 } ], - "md5sum": "1b55a46a61b4c4c44d98239d787cf521" + "md5sum": "8d311f71a279bc57e82db1bfee4377e0" }, { "dataPath": "params_shard_52.bin", @@ -3245,7 +3245,7 @@ "byteOffset": 33425408 } ], - "md5sum": "8cdb1371166272e1a9084901fc4be2f2" + "md5sum": "64e85992e12b41d931b4135988285364" }, { "dataPath": "params_shard_53.bin", @@ -3264,7 +3264,7 @@ "byteOffset": 0 } ], - "md5sum": "8d9bb581a610c0f8253fb86edb63b3e7" + "md5sum": "c9311d3be9641447bf58117d7e8c58a7" }, { "dataPath": "params_shard_54.bin", @@ -3369,7 +3369,7 @@ "byteOffset": 30896128 } ], - "md5sum": "35b6c52919b02d23fcc4eb6c96fa3939" + "md5sum": "d621aecf6605c376c716c5740763cd54" }, { "dataPath": "params_shard_55.bin", @@ -3388,7 +3388,7 @@ "byteOffset": 0 } ], - "md5sum": "4fdd2e740eb529f99aa42517aff952e1" + "md5sum": "d3b2599308c53564ab04eb7c13b15fad" }, { "dataPath": "params_shard_56.bin", @@ -3493,7 +3493,7 @@ "byteOffset": 30896128 } ], - "md5sum": "34d8e5a154849d6cd0e80c3cbfeb415a" + "md5sum": "efdbce3b0bdac0012a5351dde276b4cc" }, { "dataPath": "params_shard_57.bin", @@ -3512,7 +3512,7 @@ "byteOffset": 0 } ], - "md5sum": "5424057c52fefadd949acaf659270b4f" + "md5sum": "5e4f4154f7e37074b030ef2ba84f99fe" }, { "dataPath": "params_shard_58.bin", @@ -3617,7 +3617,7 @@ "byteOffset": 30896128 } ], - "md5sum": "d9a4476ee91dcd2b8b4e1fc21e62e3ae" + "md5sum": "852443b009f7b915ac3d3b9058bd8473" }, { "dataPath": "params_shard_59.bin", @@ -3636,7 +3636,7 @@ "byteOffset": 0 } ], - "md5sum": "3c7dfad2b08f7f7286e527bb245d0c22" + "md5sum": "e7e25940d67c00c1b8d30e56ea7d5fd4" }, { "dataPath": "params_shard_60.bin", @@ -3741,7 +3741,7 @@ "byteOffset": 30896128 } ], - "md5sum": "021ced36e57a5c9c9c4799aaa95aa1b3" + "md5sum": "94d1dfa1be75385702998e301115055a" }, { "dataPath": "params_shard_61.bin", @@ -3760,7 +3760,7 @@ "byteOffset": 0 } ], - "md5sum": "15b1fe414b809a835331cb0688bd903f" + "md5sum": "4608f00654ceaa9953c3daccb281330b" }, { "dataPath": "params_shard_62.bin", @@ -3865,7 +3865,7 @@ "byteOffset": 30896128 } ], - "md5sum": "7b85b21a4f10e21933aa76f10079d7c6" + "md5sum": "9bd35cc0fed109dedcb6e04ff7d162d2" }, { "dataPath": "params_shard_63.bin", @@ -3884,7 +3884,7 @@ "byteOffset": 0 } ], - "md5sum": "80ffcfa1ab4cb04357f75e1fcd6d2018" + "md5sum": "5f3ccfc709639df0a73db5ee3a960fb7" }, { "dataPath": "params_shard_64.bin", @@ -3989,12 +3989,12 @@ "byteOffset": 30896128 } ], - "md5sum": "1a6d6b9b372685fc903858f709c330d3" + "md5sum": "ad1237b06fbd0528c9f8e23cf79a8891" }, { "dataPath": "params_shard_65.bin", "format": "raw-shard", - "nbytes": 31968980, + "nbytes": 27834368, "records": [ { "name": "model.h.9.mixer.out_proj.q_weight", @@ -4076,26 +4076,15 @@ "byteOffset": 17041408 }, { - "name": "vision_embed_tokens.img_processor.vision_model.embeddings.position_embedding.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.embeddings.position_embedding.weight", "shape": [ 577, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 240032, - "byteOffset": 18245632 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.embeddings.position_embedding.q_scale", - "shape": [ - 577, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 30004, - "byteOffset": 18485664 + "nbytes": 1181696, + "byteOffset": 18245632 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.layer_norm1.bias", @@ -4105,7 +4094,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 18515668 + "byteOffset": 19427328 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.layer_norm1.weight", @@ -4115,7 +4104,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 18517716 + "byteOffset": 19429376 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.layer_norm2.bias", @@ -4125,7 +4114,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 18519764 + "byteOffset": 19431424 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.layer_norm2.weight", @@ -4135,7 +4124,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 18521812 + "byteOffset": 19433472 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.mlp.fc1.bias", @@ -4145,29 +4134,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 18523860 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.mlp.fc1.q_weight", - "shape": [ - 4096, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1703936, - "byteOffset": 18532052 + "byteOffset": 19435520 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.mlp.fc1.weight", "shape": [ 4096, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 212992, - "byteOffset": 20235988 + "nbytes": 8388608, + "byteOffset": 19443712 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.mlp.fc2.bias", @@ -4177,29 +4155,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 20448980 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.mlp.fc2.q_weight", - "shape": [ - 1024, - 412 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1687552, - "byteOffset": 20451028 - }, + "byteOffset": 27832320 + } + ], + "md5sum": "e9f4130276ed5535299d74f5e68e0597" + }, + { + "dataPath": "params_shard_66.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.mlp.fc2.weight", "shape": [ 1024, - 103 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 210944, - "byteOffset": 22138580 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.k_proj.bias", @@ -4209,29 +4184,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 22349524 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 22351572 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.k_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 22777556 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.out_proj.bias", @@ -4241,29 +4205,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 22830804 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 22832852 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.out_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 23258836 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.q_proj.bias", @@ -4273,29 +4226,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 23312084 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 23314132 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.q_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 23740116 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.v_proj.bias", @@ -4305,29 +4247,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 23793364 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 23795412 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.v_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 24221396 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.layer_norm1.bias", @@ -4337,7 +4268,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 24274644 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.layer_norm1.weight", @@ -4347,7 +4278,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 24276692 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.layer_norm2.bias", @@ -4357,7 +4288,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 24278740 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.layer_norm2.weight", @@ -4367,7 +4298,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 24280788 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.mlp.fc1.bias", @@ -4377,29 +4308,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 24282836 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.mlp.fc1.q_weight", - "shape": [ - 4096, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1703936, - "byteOffset": 24291028 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.mlp.fc1.weight", "shape": [ 4096, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 212992, - "byteOffset": 25994964 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.mlp.fc2.bias", @@ -4409,29 +4329,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 26207956 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.mlp.fc2.q_weight", - "shape": [ - 1024, - 412 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1687552, - "byteOffset": 26210004 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "12ccc3786467895471d31bb5b1d2610c" + }, + { + "dataPath": "params_shard_67.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.mlp.fc2.weight", "shape": [ 1024, - 103 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 210944, - "byteOffset": 27897556 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.k_proj.bias", @@ -4441,29 +4358,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 28108500 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 28110548 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.k_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 28536532 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.out_proj.bias", @@ -4473,29 +4379,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 28589780 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 28591828 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.out_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 29017812 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.q_proj.bias", @@ -4505,29 +4400,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 29071060 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 29073108 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.q_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 29499092 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.v_proj.bias", @@ -4537,29 +4421,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 29552340 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 29554388 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.v_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 29980372 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.layer_norm1.bias", @@ -4569,7 +4442,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 30033620 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.layer_norm1.weight", @@ -4579,7 +4452,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 30035668 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.layer_norm2.bias", @@ -4589,7 +4462,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 30037716 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.layer_norm2.weight", @@ -4599,7 +4472,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 30039764 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.mlp.fc1.bias", @@ -4609,29 +4482,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 30041812 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.mlp.fc1.q_weight", - "shape": [ - 4096, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1703936, - "byteOffset": 30050004 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.mlp.fc1.weight", "shape": [ 4096, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 212992, - "byteOffset": 31753940 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.mlp.fc2.bias", @@ -4641,37 +4503,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 31966932 + "byteOffset": 25190400 } ], - "md5sum": "50ec01b6812197d7e6a45c6f47b0dfe5" + "md5sum": "dcc2adf61aa07fe189bb15874110e845" }, { - "dataPath": "params_shard_66.bin", + "dataPath": "params_shard_68.bin", "format": "raw-shard", - "nbytes": 32634880, + "nbytes": 25192448, "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.mlp.fc2.q_weight", - "shape": [ - 1024, - 412 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1687552, - "byteOffset": 0 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.mlp.fc2.weight", "shape": [ 1024, - 103 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 210944, - "byteOffset": 1687552 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.k_proj.bias", @@ -4681,29 +4532,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 1898496 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 1900544 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.k_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 2326528 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.out_proj.bias", @@ -4713,29 +4553,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 2379776 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 2381824 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.out_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 2807808 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.q_proj.bias", @@ -4745,29 +4574,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 2861056 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 2863104 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.q_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 3289088 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.v_proj.bias", @@ -4777,29 +4595,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 3342336 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 3344384 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.v_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 3770368 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.layer_norm1.bias", @@ -4809,7 +4616,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 3823616 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.layer_norm1.weight", @@ -4819,7 +4626,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 3825664 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.layer_norm2.bias", @@ -4829,7 +4636,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 3827712 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.layer_norm2.weight", @@ -4839,7 +4646,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 3829760 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.mlp.fc1.bias", @@ -4849,29 +4656,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 3831808 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.mlp.fc1.q_weight", - "shape": [ - 4096, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1703936, - "byteOffset": 3840000 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.mlp.fc1.weight", "shape": [ 4096, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 212992, - "byteOffset": 5543936 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.mlp.fc2.bias", @@ -4881,29 +4677,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 5756928 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.mlp.fc2.q_weight", - "shape": [ - 1024, - 412 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1687552, - "byteOffset": 5758976 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "9f8d49d8894a05f4179ba707925e9d59" + }, + { + "dataPath": "params_shard_69.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.mlp.fc2.weight", "shape": [ 1024, - 103 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 210944, - "byteOffset": 7446528 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.k_proj.bias", @@ -4913,29 +4706,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 7657472 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 7659520 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.k_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 8085504 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.out_proj.bias", @@ -4945,29 +4727,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 8138752 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 8140800 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.out_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 8566784 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.q_proj.bias", @@ -4977,29 +4748,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 8620032 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 8622080 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.q_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 9048064 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.v_proj.bias", @@ -5009,29 +4769,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 9101312 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 9103360 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.v_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 9529344 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.layer_norm1.bias", @@ -5041,7 +4790,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 9582592 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.layer_norm1.weight", @@ -5051,7 +4800,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 9584640 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.layer_norm2.bias", @@ -5061,7 +4810,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 9586688 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.layer_norm2.weight", @@ -5071,7 +4820,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 9588736 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.mlp.fc1.bias", @@ -5081,29 +4830,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 9590784 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.mlp.fc1.q_weight", - "shape": [ - 4096, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1703936, - "byteOffset": 9598976 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.mlp.fc1.weight", "shape": [ 4096, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 212992, - "byteOffset": 11302912 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.mlp.fc2.bias", @@ -5113,29 +4851,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 11515904 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.mlp.fc2.q_weight", - "shape": [ - 1024, - 412 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1687552, - "byteOffset": 11517952 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "19b6f5d2cfc839108f9156b8b521d3ce" + }, + { + "dataPath": "params_shard_70.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.mlp.fc2.weight", "shape": [ 1024, - 103 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 210944, - "byteOffset": 13205504 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.k_proj.bias", @@ -5145,29 +4880,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 13416448 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 13418496 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.k_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 13844480 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.out_proj.bias", @@ -5177,29 +4901,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 13897728 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 13899776 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.out_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 14325760 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.q_proj.bias", @@ -5209,29 +4922,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 14379008 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 14381056 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.q_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 14807040 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.v_proj.bias", @@ -5241,29 +4943,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 14860288 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 14862336 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.v_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 15288320 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.layer_norm1.bias", @@ -5273,7 +4964,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 15341568 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.layer_norm1.weight", @@ -5283,7 +4974,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 15343616 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.layer_norm2.bias", @@ -5293,7 +4984,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 15345664 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.layer_norm2.weight", @@ -5303,7 +4994,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 15347712 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.mlp.fc1.bias", @@ -5313,29 +5004,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 15349760 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.mlp.fc1.q_weight", - "shape": [ - 4096, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1703936, - "byteOffset": 15357952 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.mlp.fc1.weight", "shape": [ 4096, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 212992, - "byteOffset": 17061888 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.mlp.fc2.bias", @@ -5345,29 +5025,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 17274880 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.mlp.fc2.q_weight", - "shape": [ - 1024, - 412 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1687552, - "byteOffset": 17276928 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "3e6322c0673873144d67964c709fa3be" + }, + { + "dataPath": "params_shard_71.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.mlp.fc2.weight", "shape": [ 1024, - 103 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 210944, - "byteOffset": 18964480 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.k_proj.bias", @@ -5377,29 +5054,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 19175424 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 19177472 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.k_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 19603456 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.out_proj.bias", @@ -5409,29 +5075,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 19656704 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 19658752 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.out_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 20084736 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.q_proj.bias", @@ -5441,29 +5096,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 20137984 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 20140032 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.q_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 20566016 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.v_proj.bias", @@ -5473,29 +5117,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 20619264 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 20621312 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.v_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 21047296 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.layer_norm1.bias", @@ -5505,7 +5138,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 21100544 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.layer_norm1.weight", @@ -5515,7 +5148,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 21102592 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.layer_norm2.bias", @@ -5525,7 +5158,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 21104640 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.layer_norm2.weight", @@ -5535,7 +5168,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 21106688 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.mlp.fc1.bias", @@ -5545,29 +5178,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 21108736 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.mlp.fc1.q_weight", - "shape": [ - 4096, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1703936, - "byteOffset": 21116928 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.mlp.fc1.weight", "shape": [ 4096, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 212992, - "byteOffset": 22820864 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.mlp.fc2.bias", @@ -5577,29 +5199,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 23033856 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.mlp.fc2.q_weight", - "shape": [ - 1024, - 412 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1687552, - "byteOffset": 23035904 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "f04370015a40ae2073f5d89ad86f1c42" + }, + { + "dataPath": "params_shard_72.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.mlp.fc2.weight", "shape": [ 1024, - 103 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 210944, - "byteOffset": 24723456 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.k_proj.bias", @@ -5609,29 +5228,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 24934400 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 24936448 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.k_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 25362432 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.out_proj.bias", @@ -5641,29 +5249,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 25415680 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 25417728 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.out_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 25843712 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.q_proj.bias", @@ -5673,29 +5270,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 25896960 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 25899008 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.q_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 26324992 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.v_proj.bias", @@ -5705,29 +5291,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 26378240 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 26380288 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.v_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 26806272 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.layer_norm1.bias", @@ -5737,7 +5312,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 26859520 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.layer_norm1.weight", @@ -5747,7 +5322,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 26861568 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.layer_norm2.bias", @@ -5757,7 +5332,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 26863616 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.layer_norm2.weight", @@ -5767,7 +5342,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 26865664 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.mlp.fc1.bias", @@ -5777,29 +5352,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 26867712 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.mlp.fc1.q_weight", - "shape": [ - 4096, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1703936, - "byteOffset": 26875904 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.mlp.fc1.weight", "shape": [ 4096, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 212992, - "byteOffset": 28579840 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.mlp.fc2.bias", @@ -5809,29 +5373,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 28792832 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.mlp.fc2.q_weight", - "shape": [ - 1024, - 412 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1687552, - "byteOffset": 28794880 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "e2c99d455ee851ede30d282481166453" + }, + { + "dataPath": "params_shard_73.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.mlp.fc2.weight", "shape": [ 1024, - 103 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 210944, - "byteOffset": 30482432 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.k_proj.bias", @@ -5841,29 +5402,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 30693376 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 30695424 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.k_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 31121408 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.out_proj.bias", @@ -5873,29 +5423,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 31174656 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 31176704 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.out_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 31602688 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.q_proj.bias", @@ -5905,29 +5444,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 31655936 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 31657984 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.q_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 32083968 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.v_proj.bias", @@ -5937,29 +5465,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 32137216 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 32139264 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.v_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 32565248 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.layer_norm1.bias", @@ -5969,7 +5486,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 32618496 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.layer_norm1.weight", @@ -5979,7 +5496,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 32620544 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.layer_norm2.bias", @@ -5989,7 +5506,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 32622592 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.layer_norm2.weight", @@ -5999,7 +5516,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 32624640 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.mlp.fc1.bias", @@ -6009,37 +5526,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 32626688 - } - ], - "md5sum": "81c15ab7a906dcc39b7bf83864d4b44f" - }, - { - "dataPath": "params_shard_67.bin", - "format": "raw-shard", - "nbytes": 33521664, - "records": [ - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.mlp.fc1.q_weight", - "shape": [ - 4096, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1703936, - "byteOffset": 0 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.mlp.fc1.weight", "shape": [ 4096, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 212992, - "byteOffset": 1703936 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.mlp.fc2.bias", @@ -6049,29 +5547,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 1916928 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.mlp.fc2.q_weight", - "shape": [ - 1024, - 412 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1687552, - "byteOffset": 1918976 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "11c75f74757caccc61b9f6c3f39a9737" + }, + { + "dataPath": "params_shard_74.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.mlp.fc2.weight", "shape": [ 1024, - 103 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 210944, - "byteOffset": 3606528 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.k_proj.bias", @@ -6081,61 +5576,39 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 3817472 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.k_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.k_proj.weight", "shape": [ 1024, - 104 + 1024 ], - "dtype": "uint32", + "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 3819520 + "nbytes": 2097152, + "byteOffset": 8390656 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.k_proj.q_scale", - "shape": [ - 1024, - 26 - ], - "dtype": "float16", - "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 4245504 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.out_proj.bias", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.out_proj.bias", "shape": [ 1024 ], "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 4298752 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 4300800 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.out_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 4726784 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.q_proj.bias", @@ -6145,29 +5618,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 4780032 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.q_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.q_proj.weight", "shape": [ 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 4782080 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.q_proj.q_scale", - "shape": [ - 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 5208064 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.v_proj.bias", @@ -6177,29 +5639,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 5261312 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.v_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.v_proj.weight", "shape": [ 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 5263360 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.v_proj.q_scale", - "shape": [ - 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 5689344 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.layer_norm1.bias", @@ -6209,7 +5660,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 5742592 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.layer_norm1.weight", @@ -6219,7 +5670,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 5744640 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.layer_norm2.bias", @@ -6229,7 +5680,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 5746688 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.layer_norm2.weight", @@ -6239,7 +5690,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 5748736 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.mlp.fc1.bias", @@ -6249,29 +5700,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 5750784 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.mlp.fc1.q_weight", - "shape": [ - 4096, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1703936, - "byteOffset": 5758976 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.mlp.fc1.weight", "shape": [ 4096, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 212992, - "byteOffset": 7462912 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.mlp.fc2.bias", @@ -6281,29 +5721,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 7675904 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.mlp.fc2.q_weight", - "shape": [ - 1024, - 412 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1687552, - "byteOffset": 7677952 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "a7f57fd25793b85aa6027a514efc39fb" + }, + { + "dataPath": "params_shard_75.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.mlp.fc2.weight", "shape": [ 1024, - 103 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 210944, - "byteOffset": 9365504 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.k_proj.bias", @@ -6313,29 +5750,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 9576448 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 9578496 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.k_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 10004480 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.out_proj.bias", @@ -6345,29 +5771,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 10057728 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.out_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.out_proj.weight", "shape": [ 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 10059776 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.out_proj.q_scale", - "shape": [ - 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 10485760 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.q_proj.bias", @@ -6377,29 +5792,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 10539008 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.q_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.q_proj.weight", "shape": [ 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 10541056 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.q_proj.q_scale", - "shape": [ - 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 10967040 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.v_proj.bias", @@ -6409,29 +5813,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 11020288 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.v_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.v_proj.weight", "shape": [ 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 11022336 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.v_proj.q_scale", - "shape": [ - 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 11448320 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.layer_norm1.bias", @@ -6441,7 +5834,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 11501568 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.layer_norm1.weight", @@ -6451,7 +5844,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 11503616 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.layer_norm2.bias", @@ -6461,7 +5854,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 11505664 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.layer_norm2.weight", @@ -6471,7 +5864,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 11507712 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.mlp.fc1.bias", @@ -6481,29 +5874,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 11509760 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.mlp.fc1.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.mlp.fc1.weight", "shape": [ 4096, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1703936, - "byteOffset": 11517952 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.mlp.fc1.q_scale", - "shape": [ - 4096, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 212992, - "byteOffset": 13221888 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.mlp.fc2.bias", @@ -6513,29 +5895,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 13434880 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.mlp.fc2.q_weight", - "shape": [ - 1024, - 412 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1687552, - "byteOffset": 13436928 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "e13228942bc433e638fe3903001715f3" + }, + { + "dataPath": "params_shard_76.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.mlp.fc2.weight", "shape": [ 1024, - 103 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 210944, - "byteOffset": 15124480 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.k_proj.bias", @@ -6545,29 +5924,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 15335424 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.k_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.k_proj.weight", "shape": [ 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 15337472 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.k_proj.q_scale", - "shape": [ - 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 15763456 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.out_proj.bias", @@ -6577,29 +5945,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 15816704 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.out_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.out_proj.weight", "shape": [ 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 15818752 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.out_proj.q_scale", - "shape": [ - 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 16244736 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.q_proj.bias", @@ -6609,29 +5966,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 16297984 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.q_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.q_proj.weight", "shape": [ 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 16300032 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.q_proj.q_scale", - "shape": [ - 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 16726016 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.v_proj.bias", @@ -6641,29 +5987,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 16779264 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.v_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.v_proj.weight", "shape": [ 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 16781312 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.v_proj.q_scale", - "shape": [ - 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 17207296 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.layer_norm1.bias", @@ -6673,7 +6008,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 17260544 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.layer_norm1.weight", @@ -6683,7 +6018,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 17262592 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.layer_norm2.bias", @@ -6693,7 +6028,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 17264640 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.layer_norm2.weight", @@ -6703,7 +6038,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 17266688 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.mlp.fc1.bias", @@ -6713,29 +6048,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 17268736 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.mlp.fc1.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.mlp.fc1.weight", "shape": [ 4096, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1703936, - "byteOffset": 17276928 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.mlp.fc1.q_scale", - "shape": [ - 4096, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 212992, - "byteOffset": 18980864 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.mlp.fc2.bias", @@ -6745,29 +6069,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 19193856 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.mlp.fc2.q_weight", - "shape": [ - 1024, - 412 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1687552, - "byteOffset": 19195904 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "eab0a6fc1a1e3beac991a0be01fdefe8" + }, + { + "dataPath": "params_shard_77.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.mlp.fc2.weight", "shape": [ 1024, - 103 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 210944, - "byteOffset": 20883456 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.k_proj.bias", @@ -6777,29 +6098,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 21094400 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 21096448 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.k_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 21522432 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.out_proj.bias", @@ -6809,29 +6119,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 21575680 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.out_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.out_proj.weight", "shape": [ 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 21577728 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.out_proj.q_scale", - "shape": [ - 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 22003712 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.q_proj.bias", @@ -6841,29 +6140,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 22056960 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.q_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.q_proj.weight", "shape": [ 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 22059008 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.q_proj.q_scale", - "shape": [ - 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 22484992 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.v_proj.bias", @@ -6873,29 +6161,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 22538240 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 22540288 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.v_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 22966272 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.layer_norm1.bias", @@ -6905,7 +6182,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 23019520 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.layer_norm1.weight", @@ -6915,7 +6192,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 23021568 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.layer_norm2.bias", @@ -6925,7 +6202,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 23023616 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.layer_norm2.weight", @@ -6935,7 +6212,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 23025664 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.mlp.fc1.bias", @@ -6945,29 +6222,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 23027712 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.mlp.fc1.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.mlp.fc1.weight", "shape": [ 4096, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1703936, - "byteOffset": 23035904 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.mlp.fc1.q_scale", - "shape": [ - 4096, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 212992, - "byteOffset": 24739840 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.mlp.fc2.bias", @@ -6977,29 +6243,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 24952832 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.mlp.fc2.q_weight", - "shape": [ - 1024, - 412 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1687552, - "byteOffset": 24954880 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "afcfd0263f305fcc63e7b86393753bf7" + }, + { + "dataPath": "params_shard_78.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.mlp.fc2.weight", "shape": [ 1024, - 103 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 210944, - "byteOffset": 26642432 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.k_proj.bias", @@ -7009,29 +6272,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 26853376 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.k_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.k_proj.weight", "shape": [ 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 26855424 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.k_proj.q_scale", - "shape": [ - 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 27281408 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.out_proj.bias", @@ -7041,29 +6293,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 27334656 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.out_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.out_proj.weight", "shape": [ 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 27336704 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.out_proj.q_scale", - "shape": [ - 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 27762688 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.q_proj.bias", @@ -7073,29 +6314,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 27815936 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 27817984 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.q_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 28243968 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.v_proj.bias", @@ -7105,29 +6335,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 28297216 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.v_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.v_proj.weight", "shape": [ 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 28299264 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.v_proj.q_scale", - "shape": [ - 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 28725248 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.layer_norm1.bias", @@ -7137,7 +6356,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 28778496 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.layer_norm1.weight", @@ -7147,7 +6366,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 28780544 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.layer_norm2.bias", @@ -7157,7 +6376,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 28782592 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.layer_norm2.weight", @@ -7167,7 +6386,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 28784640 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.mlp.fc1.bias", @@ -7177,29 +6396,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 28786688 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.mlp.fc1.q_weight", - "shape": [ - 4096, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1703936, - "byteOffset": 28794880 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.mlp.fc1.weight", "shape": [ 4096, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 212992, - "byteOffset": 30498816 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.mlp.fc2.bias", @@ -7209,29 +6417,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 30711808 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.mlp.fc2.q_weight", - "shape": [ - 1024, - 412 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1687552, - "byteOffset": 30713856 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "460a8bc76edf812f85886ec9f950f395" + }, + { + "dataPath": "params_shard_79.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.mlp.fc2.weight", "shape": [ 1024, - 103 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 210944, - "byteOffset": 32401408 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.k_proj.bias", @@ -7241,29 +6446,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 32612352 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.k_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.k_proj.weight", "shape": [ 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 32614400 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.k_proj.q_scale", - "shape": [ - 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 33040384 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.out_proj.bias", @@ -7273,37 +6467,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 33093632 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.out_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.out_proj.weight", "shape": [ 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 33095680 - } - ], - "md5sum": "c24f2e57d8e79878e359cf6ab34d1bee" - }, - { - "dataPath": "params_shard_68.bin", - "format": "raw-shard", - "nbytes": 33433600, - "records": [ - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.out_proj.q_scale", - "shape": [ - 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 0 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.q_proj.bias", @@ -7313,29 +6488,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 53248 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 55296 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.q_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 481280 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.v_proj.bias", @@ -7345,29 +6509,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 534528 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.v_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.v_proj.weight", "shape": [ 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 536576 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.v_proj.q_scale", - "shape": [ - 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 962560 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.layer_norm1.bias", @@ -7377,7 +6530,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 1015808 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.layer_norm1.weight", @@ -7387,7 +6540,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 1017856 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.layer_norm2.bias", @@ -7397,7 +6550,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 1019904 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.layer_norm2.weight", @@ -7407,7 +6560,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 1021952 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.mlp.fc1.bias", @@ -7417,29 +6570,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 1024000 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.mlp.fc1.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.mlp.fc1.weight", "shape": [ 4096, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1703936, - "byteOffset": 1032192 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.mlp.fc1.q_scale", - "shape": [ - 4096, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 212992, - "byteOffset": 2736128 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.mlp.fc2.bias", @@ -7449,29 +6591,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 2949120 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.mlp.fc2.q_weight", - "shape": [ - 1024, - 412 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1687552, - "byteOffset": 2951168 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "bcac984764bba0a4eb9891d2043e1d89" + }, + { + "dataPath": "params_shard_80.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.mlp.fc2.weight", "shape": [ 1024, - 103 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 210944, - "byteOffset": 4638720 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.k_proj.bias", @@ -7481,29 +6620,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 4849664 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.k_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.k_proj.weight", "shape": [ 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 4851712 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.k_proj.q_scale", - "shape": [ - 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 5277696 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.out_proj.bias", @@ -7513,29 +6641,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 5330944 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.out_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.out_proj.weight", "shape": [ 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 5332992 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.out_proj.q_scale", - "shape": [ - 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 5758976 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.q_proj.bias", @@ -7545,29 +6662,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 5812224 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 5814272 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.q_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 6240256 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.v_proj.bias", @@ -7577,29 +6683,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 6293504 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 6295552 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.v_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 6721536 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.layer_norm1.bias", @@ -7609,7 +6704,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 6774784 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.layer_norm1.weight", @@ -7619,7 +6714,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 6776832 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.layer_norm2.bias", @@ -7629,7 +6724,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 6778880 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.layer_norm2.weight", @@ -7639,7 +6734,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 6780928 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.mlp.fc1.bias", @@ -7649,29 +6744,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 6782976 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.mlp.fc1.q_weight", - "shape": [ - 4096, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1703936, - "byteOffset": 6791168 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.mlp.fc1.weight", "shape": [ 4096, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 212992, - "byteOffset": 8495104 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.mlp.fc2.bias", @@ -7681,29 +6765,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 8708096 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.mlp.fc2.q_weight", - "shape": [ - 1024, - 412 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1687552, - "byteOffset": 8710144 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "3197e582d745d84c2ab4347a1f2d4e2d" + }, + { + "dataPath": "params_shard_81.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.mlp.fc2.weight", "shape": [ 1024, - 103 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 210944, - "byteOffset": 10397696 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.k_proj.bias", @@ -7713,29 +6794,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 10608640 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 10610688 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.k_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 11036672 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.out_proj.bias", @@ -7745,29 +6815,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 11089920 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 11091968 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.out_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 11517952 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.q_proj.bias", @@ -7777,29 +6836,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 11571200 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 11573248 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.q_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 11999232 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.v_proj.bias", @@ -7809,29 +6857,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 12052480 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 12054528 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.v_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 12480512 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.layer_norm1.bias", @@ -7841,7 +6878,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 12533760 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.layer_norm1.weight", @@ -7851,7 +6888,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 12535808 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.layer_norm2.bias", @@ -7861,7 +6898,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 12537856 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.layer_norm2.weight", @@ -7871,7 +6908,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 12539904 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.mlp.fc1.bias", @@ -7881,29 +6918,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 12541952 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.mlp.fc1.q_weight", - "shape": [ - 4096, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1703936, - "byteOffset": 12550144 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.mlp.fc1.weight", "shape": [ 4096, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 212992, - "byteOffset": 14254080 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.mlp.fc2.bias", @@ -7913,29 +6939,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 14467072 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.mlp.fc2.q_weight", - "shape": [ - 1024, - 412 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1687552, - "byteOffset": 14469120 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "e6d67ae9f4dab5ea49fac79bceac7a86" + }, + { + "dataPath": "params_shard_82.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.mlp.fc2.weight", "shape": [ 1024, - 103 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 210944, - "byteOffset": 16156672 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.k_proj.bias", @@ -7945,29 +6968,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 16367616 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 16369664 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.k_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 16795648 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.out_proj.bias", @@ -7977,29 +6989,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 16848896 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 16850944 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.out_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 17276928 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.q_proj.bias", @@ -8009,29 +7010,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 17330176 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 17332224 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.q_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 17758208 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.v_proj.bias", @@ -8041,29 +7031,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 17811456 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 17813504 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.v_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 18239488 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.layer_norm1.bias", @@ -8073,7 +7052,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 18292736 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.layer_norm1.weight", @@ -8083,7 +7062,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 18294784 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.layer_norm2.bias", @@ -8093,7 +7072,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 18296832 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.layer_norm2.weight", @@ -8103,7 +7082,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 18298880 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.mlp.fc1.bias", @@ -8113,29 +7092,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 18300928 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.mlp.fc1.q_weight", - "shape": [ - 4096, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1703936, - "byteOffset": 18309120 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.mlp.fc1.weight", "shape": [ 4096, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 212992, - "byteOffset": 20013056 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.mlp.fc2.bias", @@ -8145,29 +7113,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 20226048 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.mlp.fc2.q_weight", - "shape": [ - 1024, - 412 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1687552, - "byteOffset": 20228096 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "1a74510bf14d6fc06b53f09ee6a22fdd" + }, + { + "dataPath": "params_shard_83.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.mlp.fc2.weight", "shape": [ 1024, - 103 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 210944, - "byteOffset": 21915648 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.k_proj.bias", @@ -8177,29 +7142,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 22126592 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 22128640 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.k_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 22554624 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.out_proj.bias", @@ -8209,29 +7163,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 22607872 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 22609920 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.out_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 23035904 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.q_proj.bias", @@ -8241,29 +7184,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 23089152 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 23091200 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.q_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 23517184 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.v_proj.bias", @@ -8273,29 +7205,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 23570432 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 23572480 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.v_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 23998464 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.layer_norm1.bias", @@ -8305,7 +7226,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 24051712 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.layer_norm1.weight", @@ -8315,7 +7236,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 24053760 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.layer_norm2.bias", @@ -8325,7 +7246,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 24055808 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.layer_norm2.weight", @@ -8335,7 +7256,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 24057856 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.mlp.fc1.bias", @@ -8345,29 +7266,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 24059904 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.mlp.fc1.q_weight", - "shape": [ - 4096, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1703936, - "byteOffset": 24068096 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.mlp.fc1.weight", "shape": [ 4096, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 212992, - "byteOffset": 25772032 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.mlp.fc2.bias", @@ -8377,29 +7287,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 25985024 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.mlp.fc2.q_weight", - "shape": [ - 1024, - 412 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1687552, - "byteOffset": 25987072 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "75a9ee23e852e5562e2176a5ece04f24" + }, + { + "dataPath": "params_shard_84.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.mlp.fc2.weight", "shape": [ 1024, - 103 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 210944, - "byteOffset": 27674624 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.k_proj.bias", @@ -8409,29 +7316,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 27885568 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 27887616 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.k_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 28313600 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.out_proj.bias", @@ -8441,29 +7337,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 28366848 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 28368896 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.out_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 28794880 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.q_proj.bias", @@ -8473,29 +7358,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 28848128 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 28850176 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.q_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 29276160 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.v_proj.bias", @@ -8505,29 +7379,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 29329408 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 29331456 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.v_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 29757440 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.layer_norm1.bias", @@ -8537,7 +7400,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 29810688 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.layer_norm1.weight", @@ -8547,7 +7410,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 29812736 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.layer_norm2.bias", @@ -8557,7 +7420,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 29814784 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.layer_norm2.weight", @@ -8567,7 +7430,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 29816832 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.mlp.fc1.bias", @@ -8577,29 +7440,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 29818880 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.mlp.fc1.q_weight", - "shape": [ - 4096, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1703936, - "byteOffset": 29827072 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.mlp.fc1.weight", "shape": [ 4096, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 212992, - "byteOffset": 31531008 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.mlp.fc2.bias", @@ -8609,36 +7461,25 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 31744000 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.mlp.fc2.q_weight", - "shape": [ - 1024, - 412 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1687552, - "byteOffset": 31746048 + "byteOffset": 25190400 } ], - "md5sum": "a2dadce37a87f77e5bc03f6942019c7b" + "md5sum": "da3f4d64dad38aa57a47fd6fbca1a334" }, { - "dataPath": "params_shard_69.bin", + "dataPath": "params_shard_85.bin", "format": "raw-shard", - "nbytes": 30887936, + "nbytes": 25192448, "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.mlp.fc2.weight", "shape": [ 1024, - 103 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 210944, + "nbytes": 8388608, "byteOffset": 0 }, { @@ -8649,29 +7490,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 210944 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.k_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.k_proj.weight", "shape": [ 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 212992 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.k_proj.q_scale", - "shape": [ - 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 638976 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.out_proj.bias", @@ -8681,61 +7511,39 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 692224 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.out_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.out_proj.weight", "shape": [ 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 694272 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.out_proj.q_scale", - "shape": [ - 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 1120256 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.q_proj.bias", "shape": [ 1024 ], - "dtype": "float16", - "format": "f32-to-bf16", - "nbytes": 2048, - "byteOffset": 1173504 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", + "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 1175552 + "nbytes": 2048, + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.q_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 1601536 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.v_proj.bias", @@ -8745,29 +7553,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 1654784 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 1656832 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.v_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 2082816 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.layer_norm1.bias", @@ -8777,7 +7574,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 2136064 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.layer_norm1.weight", @@ -8787,7 +7584,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 2138112 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.layer_norm2.bias", @@ -8797,7 +7594,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 2140160 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.layer_norm2.weight", @@ -8807,7 +7604,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 2142208 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.mlp.fc1.bias", @@ -8817,29 +7614,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 2144256 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.mlp.fc1.q_weight", - "shape": [ - 4096, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1703936, - "byteOffset": 2152448 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.mlp.fc1.weight", "shape": [ 4096, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 212992, - "byteOffset": 3856384 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.mlp.fc2.bias", @@ -8849,29 +7635,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 4069376 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.mlp.fc2.q_weight", - "shape": [ - 1024, - 412 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1687552, - "byteOffset": 4071424 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "ca1eb7481171d37cc9fab4b3432d81d1" + }, + { + "dataPath": "params_shard_86.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.mlp.fc2.weight", "shape": [ 1024, - 103 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 210944, - "byteOffset": 5758976 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.k_proj.bias", @@ -8881,29 +7664,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 5969920 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 5971968 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.k_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 6397952 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.out_proj.bias", @@ -8913,29 +7685,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 6451200 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 6453248 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.out_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 6879232 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.q_proj.bias", @@ -8945,29 +7706,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 6932480 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 6934528 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.q_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 7360512 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.v_proj.bias", @@ -8977,29 +7727,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 7413760 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 7415808 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.v_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 7841792 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.layer_norm1.bias", @@ -9009,7 +7748,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 7895040 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.layer_norm1.weight", @@ -9019,7 +7758,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 7897088 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.layer_norm2.bias", @@ -9029,7 +7768,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 7899136 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.layer_norm2.weight", @@ -9039,7 +7778,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 7901184 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.mlp.fc1.bias", @@ -9049,29 +7788,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 7903232 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.mlp.fc1.q_weight", - "shape": [ - 4096, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1703936, - "byteOffset": 7911424 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.mlp.fc1.weight", "shape": [ 4096, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 212992, - "byteOffset": 9615360 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.mlp.fc2.bias", @@ -9081,29 +7809,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 9828352 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.mlp.fc2.q_weight", - "shape": [ - 1024, - 412 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1687552, - "byteOffset": 9830400 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "03be4317a6855a15625866d5dde56763" + }, + { + "dataPath": "params_shard_87.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.mlp.fc2.weight", "shape": [ 1024, - 103 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 210944, - "byteOffset": 11517952 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.k_proj.bias", @@ -9113,29 +7838,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 11728896 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.k_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.k_proj.weight", "shape": [ 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 11730944 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.k_proj.q_scale", - "shape": [ - 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 12156928 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.out_proj.bias", @@ -9145,29 +7859,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 12210176 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.out_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.out_proj.weight", "shape": [ 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 12212224 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.out_proj.q_scale", - "shape": [ - 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 12638208 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.q_proj.bias", @@ -9177,29 +7880,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 12691456 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.q_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.q_proj.weight", "shape": [ 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 12693504 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.q_proj.q_scale", - "shape": [ - 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 13119488 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.v_proj.bias", @@ -9209,29 +7901,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 13172736 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.v_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.v_proj.weight", "shape": [ 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 13174784 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.v_proj.q_scale", - "shape": [ - 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 13600768 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.layer_norm1.bias", @@ -9241,7 +7922,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 13654016 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.layer_norm1.weight", @@ -9251,7 +7932,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 13656064 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.layer_norm2.bias", @@ -9261,7 +7942,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 13658112 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.layer_norm2.weight", @@ -9271,7 +7952,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 13660160 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.mlp.fc1.bias", @@ -9281,29 +7962,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 13662208 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.mlp.fc1.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.mlp.fc1.weight", "shape": [ 4096, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1703936, - "byteOffset": 13670400 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.mlp.fc1.q_scale", - "shape": [ - 4096, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 212992, - "byteOffset": 15374336 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.mlp.fc2.bias", @@ -9313,29 +7983,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 15587328 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.mlp.fc2.q_weight", - "shape": [ - 1024, - 412 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1687552, - "byteOffset": 15589376 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "7464cccd529310def6e3920c637ad62c" + }, + { + "dataPath": "params_shard_88.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.mlp.fc2.weight", "shape": [ 1024, - 103 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 210944, - "byteOffset": 17276928 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.k_proj.bias", @@ -9345,29 +8012,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 17487872 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 17489920 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.k_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 17915904 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.out_proj.bias", @@ -9377,29 +8033,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 17969152 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 17971200 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.out_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 18397184 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.q_proj.bias", @@ -9409,29 +8054,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 18450432 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 18452480 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.q_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 18878464 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.v_proj.bias", @@ -9441,29 +8075,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 18931712 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 18933760 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.v_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 19359744 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.layer_norm1.bias", @@ -9473,7 +8096,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 19412992 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.layer_norm1.weight", @@ -9483,7 +8106,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 19415040 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.layer_norm2.bias", @@ -9493,7 +8116,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 19417088 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.layer_norm2.weight", @@ -9503,7 +8126,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 19419136 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.mlp.fc1.bias", @@ -9513,29 +8136,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 19421184 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.mlp.fc1.q_weight", - "shape": [ - 4096, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1703936, - "byteOffset": 19429376 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.mlp.fc1.weight", "shape": [ 4096, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 212992, - "byteOffset": 21133312 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.mlp.fc2.bias", @@ -9545,29 +8157,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 21346304 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.mlp.fc2.q_weight", - "shape": [ - 1024, - 412 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1687552, - "byteOffset": 21348352 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "8be48481c922751c9b723a99e5dcd727" + }, + { + "dataPath": "params_shard_89.bin", + "format": "raw-shard", + "nbytes": 26767360, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.mlp.fc2.weight", "shape": [ 1024, - 103 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 210944, - "byteOffset": 23035904 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.k_proj.bias", @@ -9577,29 +8186,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 23246848 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 23248896 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.k_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 23674880 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.out_proj.bias", @@ -9609,29 +8207,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 23728128 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 23730176 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.out_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 24156160 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.q_proj.bias", @@ -9641,29 +8228,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 24209408 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 24211456 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.q_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 24637440 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.v_proj.bias", @@ -9673,29 +8249,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 24690688 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 24692736 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.v_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 25118720 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.post_layernorm.bias", @@ -9705,7 +8270,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 25171968 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.post_layernorm.weight", @@ -9715,7 +8280,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 25174016 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.pre_layrnorm.bias", @@ -9725,7 +8290,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 25176064 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.pre_layrnorm.weight", @@ -9735,7 +8300,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 25178112 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_projection.linear_1.bias", @@ -9745,7 +8310,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 6144, - "byteOffset": 25180160 + "byteOffset": 16793600 }, { "name": "vision_embed_tokens.img_projection.linear_1.q_weight", @@ -9756,7 +8321,7 @@ "dtype": "uint32", "format": "f32-to-bf16", "nbytes": 5062656, - "byteOffset": 25186304 + "byteOffset": 16799744 }, { "name": "vision_embed_tokens.img_projection.linear_1.q_scale", @@ -9767,7 +8332,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 632832, - "byteOffset": 30248960 + "byteOffset": 21862400 }, { "name": "vision_embed_tokens.img_projection.linear_2.bias", @@ -9777,16 +8342,8 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 6144, - "byteOffset": 30881792 - } - ], - "md5sum": "96daef3567f9842251bb425924ac75a3" - }, - { - "dataPath": "params_shard_70.bin", - "format": "raw-shard", - "nbytes": 4265984, - "records": [ + "byteOffset": 22495232 + }, { "name": "vision_embed_tokens.img_projection.linear_2.q_weight", "shape": [ @@ -9796,7 +8353,7 @@ "dtype": "uint32", "format": "f32-to-bf16", "nbytes": 3784704, - "byteOffset": 0 + "byteOffset": 22501376 }, { "name": "vision_embed_tokens.img_projection.linear_2.q_scale", @@ -9807,7 +8364,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 473088, - "byteOffset": 3784704 + "byteOffset": 26286080 }, { "name": "vision_embed_tokens.sub_GN", @@ -9820,10 +8377,10 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 4257792 + "byteOffset": 26759168 } ], - "md5sum": "ebe2947681e943d49c3e4fa08218992a" + "md5sum": "91fb7eb9ed733756ed0c89a04c1a2657" } ] } \ No newline at end of file