diff --git a/mlc-chat-config.json b/mlc-chat-config.json index c807d1f58efa0325f8bb5e99f452664900ff4e6f..6e7ffaa9f6e84471e9e5fa289b229a631df36730 100644 --- a/mlc-chat-config.json +++ b/mlc-chat-config.json @@ -140,15 +140,15 @@ }, "original_max_position_embeddings": 4096, "context_window_size": 131072, - "prefill_chunk_size": 2048, + "prefill_chunk_size": 8192, "head_dim": 96, "tensor_parallel_shards": 1, - "max_batch_size": 80 + "max_batch_size": 128 }, "vocab_size": 32064, "context_window_size": 131072, "sliding_window_size": -1, - "prefill_chunk_size": 2048, + "prefill_chunk_size": 8192, "attention_sink_size": -1, "tensor_parallel_shards": 1, "pipeline_parallel_stages": 1, diff --git a/ndarray-cache.json b/ndarray-cache.json index d41ca24ddd04164f0d8591db23f3cc8a448f901e..3a436a95f1bff5fa0249af3c958a2b29bb9d1f78 100644 --- a/ndarray-cache.json +++ b/ndarray-cache.json @@ -1,8 +1,8 @@ { "metadata": { - "ParamSize": 869, - "ParamBytes": 1873364948.0, - "BitsPerParam": 3.7021917590823534 + "ParamSize": 724, + "ParamBytes": 2340679936.0, + "BitsPerParam": 4.625711599312261 }, "records": [ { @@ -22,7 +22,7 @@ "byteOffset": 0 } ], - "md5sum": "8a35ddbbc2ab05256c6c2d54d6094fda" + "md5sum": "d7e1c53f4ed3388ab3651a4ac7fe5c3b" }, { "dataPath": "params_shard_1.bin", @@ -41,7 +41,7 @@ "byteOffset": 0 } ], - "md5sum": "5e643ec4c20f60ffaeae2a841566cd75" + "md5sum": "bbe371e4c6556993e74003d072d5a519" }, { "dataPath": "params_shard_2.bin", @@ -145,7 +145,7 @@ "byteOffset": 31582336 } ], - "md5sum": "24fab578168aeadbc9559a578c7183e7" + "md5sum": "8eb6f7a52bf759728f53f0245c72a859" }, { "dataPath": "params_shard_3.bin", @@ -186,7 +186,7 @@ "byteOffset": 11335680 } ], - "md5sum": "419b98c8f9ad7d166c3979d8d9c7559b" + "md5sum": "2ba63895330a62bc1318c87c5d5072ce" }, { "dataPath": "params_shard_4.bin", @@ -205,7 +205,7 @@ "byteOffset": 0 } ], - "md5sum": "1664118860d52dd98f030f503f04ad24" + "md5sum": "9456eef90ffdc61e81ffe0800109e762" }, { "dataPath": "params_shard_5.bin", @@ -331,7 +331,7 @@ "byteOffset": 33425408 } ], - "md5sum": "c2a46d96f42d25691193feaf4dfdb7f2" + "md5sum": "cd6b9aa2b41c2140645eefb808a8a2e3" }, { "dataPath": "params_shard_6.bin", @@ -350,7 +350,7 @@ "byteOffset": 0 } ], - "md5sum": "5a0644c2a7b96ecc7f44db61c76980b1" + "md5sum": "4ec6c96f6227fce6dbe6a251dad201f3" }, { "dataPath": "params_shard_7.bin", @@ -455,7 +455,7 @@ "byteOffset": 30896128 } ], - "md5sum": "e207ed95b32cf79cd2023cf0ec11d8c7" + "md5sum": "30f769a15fbdac43ca45e6812ffecbfb" }, { "dataPath": "params_shard_8.bin", @@ -474,7 +474,7 @@ "byteOffset": 0 } ], - "md5sum": "f4302a88dfb0c1dd8f39023f158eecb1" + "md5sum": "3e20b5efdce2e340dbb820d88b3cb7e0" }, { "dataPath": "params_shard_9.bin", @@ -579,7 +579,7 @@ "byteOffset": 30896128 } ], - "md5sum": "526c77bf2a28ad9f696f99d2f36324b5" + "md5sum": "5bbad59fbf3fd94682eb75a071e0f264" }, { "dataPath": "params_shard_10.bin", @@ -598,7 +598,7 @@ "byteOffset": 0 } ], - "md5sum": "7d502dc51f0b4ba087038840e2e3fa2a" + "md5sum": "5c710bda058fe56ce812112e1b0f0ee0" }, { "dataPath": "params_shard_11.bin", @@ -703,7 +703,7 @@ "byteOffset": 30896128 } ], - "md5sum": "40b08c6e4a04c85dcc8d20763a131aaa" + "md5sum": "7a15e2962ed42b63453eaecd837ff275" }, { "dataPath": "params_shard_12.bin", @@ -722,7 +722,7 @@ "byteOffset": 0 } ], - "md5sum": "ad0c16081945fd54ca9d5bf88322cf6e" + "md5sum": "0a10e859199899afd04e346c84ef3eef" }, { "dataPath": "params_shard_13.bin", @@ -827,7 +827,7 @@ "byteOffset": 30896128 } ], - "md5sum": "ff97580cc8b519c9a0dafbec95ce9076" + "md5sum": "6bc76013f6066d9569517976841883eb" }, { "dataPath": "params_shard_14.bin", @@ -846,7 +846,7 @@ "byteOffset": 0 } ], - "md5sum": "900c18766113eff094153343f44eae68" + "md5sum": "f734322260c53272938e682d4441e076" }, { "dataPath": "params_shard_15.bin", @@ -951,7 +951,7 @@ "byteOffset": 30896128 } ], - "md5sum": "354d4710d313309d24b60d9dc0d7de86" + "md5sum": "ad714acba2104718fb5491a432b197d1" }, { "dataPath": "params_shard_16.bin", @@ -970,7 +970,7 @@ "byteOffset": 0 } ], - "md5sum": "375e40a711c06214bcf155207c27c8df" + "md5sum": "348d7841fb570d2dc49bbb93d3679134" }, { "dataPath": "params_shard_17.bin", @@ -1075,7 +1075,7 @@ "byteOffset": 30896128 } ], - "md5sum": "2a08f7bdb8837cf2659d8d2d62b47cfb" + "md5sum": "6179ab639c1bda89b3c90cb50ae11762" }, { "dataPath": "params_shard_18.bin", @@ -1094,7 +1094,7 @@ "byteOffset": 0 } ], - "md5sum": "02e503ff2aa0900aa47e73d0b85ef80d" + "md5sum": "336989816dd64c49e7eadbdea61ca170" }, { "dataPath": "params_shard_19.bin", @@ -1199,7 +1199,7 @@ "byteOffset": 30896128 } ], - "md5sum": "089a8975a68756edba36ba294c67a8ef" + "md5sum": "da3b6c34fb6d830d6245f9c61818a068" }, { "dataPath": "params_shard_20.bin", @@ -1218,7 +1218,7 @@ "byteOffset": 0 } ], - "md5sum": "e55ee3c00cc9b2fc5db22c815ed1e35f" + "md5sum": "0640e92aa128f4e05a58d7c5cc356006" }, { "dataPath": "params_shard_21.bin", @@ -1323,7 +1323,7 @@ "byteOffset": 30896128 } ], - "md5sum": "f3478b8fbcd86f16cec0803918d5e3ec" + "md5sum": "db3317dfde5ff5e937017d05543c3792" }, { "dataPath": "params_shard_22.bin", @@ -1342,7 +1342,7 @@ "byteOffset": 0 } ], - "md5sum": "2d47274575a56cc29842d9f9413d801c" + "md5sum": "0e9f6c20144e7d9da545ac535987d49c" }, { "dataPath": "params_shard_23.bin", @@ -1447,7 +1447,7 @@ "byteOffset": 30896128 } ], - "md5sum": "6871519612a4b73c0d24e2b32bcfb785" + "md5sum": "5cd3f1298c7d3e2eba61c2dccaa51fa1" }, { "dataPath": "params_shard_24.bin", @@ -1466,7 +1466,7 @@ "byteOffset": 0 } ], - "md5sum": "b90a3c96a5a1207a3574ae02a48669ef" + "md5sum": "1d625599633f2e8fdd20ea38072c1a3a" }, { "dataPath": "params_shard_25.bin", @@ -1571,7 +1571,7 @@ "byteOffset": 30896128 } ], - "md5sum": "bd8f516641f37b8ab8fdfbf5341150d7" + "md5sum": "430a7c4d1d69396f3ec1eb880b7f716f" }, { "dataPath": "params_shard_26.bin", @@ -1590,7 +1590,7 @@ "byteOffset": 0 } ], - "md5sum": "5cad5fb8c628578200af5174a42c330d" + "md5sum": "25077b71bded2893f97467c767447e8f" }, { "dataPath": "params_shard_27.bin", @@ -1695,7 +1695,7 @@ "byteOffset": 30896128 } ], - "md5sum": "3aabdc1f95147e394d5de5df9697ef2b" + "md5sum": "2239b285a54e01bb80bccbf22c562d3f" }, { "dataPath": "params_shard_28.bin", @@ -1714,7 +1714,7 @@ "byteOffset": 0 } ], - "md5sum": "381023fb23574049257f2a0eec9b554f" + "md5sum": "5e7537fcb657900a598019c4ea92dc0a" }, { "dataPath": "params_shard_29.bin", @@ -1733,7 +1733,7 @@ "byteOffset": 0 } ], - "md5sum": "b05a8053cb19739cf76c4d5e303b95ed" + "md5sum": "8409accc0efa14b9bd2212b965b6d449" }, { "dataPath": "params_shard_30.bin", @@ -1838,7 +1838,7 @@ "byteOffset": 32057472 } ], - "md5sum": "55427a0d100d982af219140f2f1b3b19" + "md5sum": "897b4fd728d5eaf06f7e5e8eb9fff479" }, { "dataPath": "params_shard_31.bin", @@ -1857,7 +1857,7 @@ "byteOffset": 0 } ], - "md5sum": "655b2041eb3bc532b2f76f8a3044a80e" + "md5sum": "d3bc8dfb66a961ed8ff8d82d62f891e6" }, { "dataPath": "params_shard_32.bin", @@ -1983,7 +1983,7 @@ "byteOffset": 33425408 } ], - "md5sum": "60597c76e7ae98d8687f3ef6d24ef84d" + "md5sum": "9fa4180ca7f3d8d2671e424df58f7d33" }, { "dataPath": "params_shard_33.bin", @@ -2002,7 +2002,7 @@ "byteOffset": 0 } ], - "md5sum": "3beb4e5859d4d77a395a9cfcda94fd21" + "md5sum": "a3f57885456413befe772a61db9fe003" }, { "dataPath": "params_shard_34.bin", @@ -2107,7 +2107,7 @@ "byteOffset": 30896128 } ], - "md5sum": "a5a2e49eb5e992f4a4da8593a0e32c46" + "md5sum": "939e4d0a910d890d33ab3aa4cfae6527" }, { "dataPath": "params_shard_35.bin", @@ -2126,7 +2126,7 @@ "byteOffset": 0 } ], - "md5sum": "a5ee83fb741c7a33c7e86784d9be28d6" + "md5sum": "ba8cc1009d70aa580a3c3464ddcf2e1b" }, { "dataPath": "params_shard_36.bin", @@ -2231,7 +2231,7 @@ "byteOffset": 30896128 } ], - "md5sum": "8b09bdf75eba6d273336c78223a3fbac" + "md5sum": "cf73ece61d143b5685eef41c20229c42" }, { "dataPath": "params_shard_37.bin", @@ -2250,7 +2250,7 @@ "byteOffset": 0 } ], - "md5sum": "a3b6820d889f86491595e7c64a292346" + "md5sum": "62f2abbb1faa52d0bce9d55753794a88" }, { "dataPath": "params_shard_38.bin", @@ -2355,7 +2355,7 @@ "byteOffset": 30896128 } ], - "md5sum": "2cf21a5ab798e9a8424ba6c8d4475414" + "md5sum": "d2acdc47a3bc43aa505032d2bb8c15f3" }, { "dataPath": "params_shard_39.bin", @@ -2374,7 +2374,7 @@ "byteOffset": 0 } ], - "md5sum": "f4ab43131aa9a0ffee3815b901dc8591" + "md5sum": "bb5529cdb10895082d3b2e5293f6d1cd" }, { "dataPath": "params_shard_40.bin", @@ -2479,7 +2479,7 @@ "byteOffset": 30896128 } ], - "md5sum": "c0cb92677fedc090b87887989db52c5b" + "md5sum": "98ef5b4e63d4701a25201cdc3c05bf12" }, { "dataPath": "params_shard_41.bin", @@ -2498,7 +2498,7 @@ "byteOffset": 0 } ], - "md5sum": "0756b15ae5e75580f8a9f33f62914dda" + "md5sum": "24522563518632d9a17f4166066cb200" }, { "dataPath": "params_shard_42.bin", @@ -2603,7 +2603,7 @@ "byteOffset": 30896128 } ], - "md5sum": "f7ec2b75978886fca92ba13a6a511bf0" + "md5sum": "8d3fab7847a5c022d510e83f15c23ad7" }, { "dataPath": "params_shard_43.bin", @@ -2622,7 +2622,7 @@ "byteOffset": 0 } ], - "md5sum": "67c0eba6afa7bead6674cbc479f6b5a7" + "md5sum": "215dc6ff0a1f211c3727dcc991c46cf1" }, { "dataPath": "params_shard_44.bin", @@ -2727,7 +2727,7 @@ "byteOffset": 30896128 } ], - "md5sum": "f67124710df92edb87263cc95ca70806" + "md5sum": "72866c136adefde27ba78274ed57619a" }, { "dataPath": "params_shard_45.bin", @@ -2746,7 +2746,7 @@ "byteOffset": 0 } ], - "md5sum": "db05762038bee40f53680fbf656b91da" + "md5sum": "7f02d5ccf7cc2c4370777d6ae00b1244" }, { "dataPath": "params_shard_46.bin", @@ -2851,7 +2851,7 @@ "byteOffset": 30896128 } ], - "md5sum": "939795fea6dc100035f9fc0a49d711b0" + "md5sum": "30abcca65e41086ad0667aacaf53384b" }, { "dataPath": "params_shard_47.bin", @@ -2870,7 +2870,7 @@ "byteOffset": 0 } ], - "md5sum": "f9fb91d66e9fca6030f1ae038d840f00" + "md5sum": "69a2467ff910a2811ef2c4542bc4fe56" }, { "dataPath": "params_shard_48.bin", @@ -2975,7 +2975,7 @@ "byteOffset": 30896128 } ], - "md5sum": "8ab8d33f317b9a6c5c60140793ff0fd3" + "md5sum": "a22c8fb5e9fed8eeee2e25e97eebabaa" }, { "dataPath": "params_shard_49.bin", @@ -2994,7 +2994,7 @@ "byteOffset": 0 } ], - "md5sum": "d02c9a6a3e469a42b7727dcbe8da5372" + "md5sum": "de1a4314be8c30ee24e9f222493b0f5b" }, { "dataPath": "params_shard_50.bin", @@ -3100,7 +3100,7 @@ "byteOffset": 31371264 } ], - "md5sum": "34bb78bf6f0142eae8fc499be2eae4a1" + "md5sum": "e236c8247a12c058d052abe0ae7fc877" }, { "dataPath": "params_shard_51.bin", @@ -3119,7 +3119,7 @@ "byteOffset": 0 } ], - "md5sum": "1b55a46a61b4c4c44d98239d787cf521" + "md5sum": "8d311f71a279bc57e82db1bfee4377e0" }, { "dataPath": "params_shard_52.bin", @@ -3245,7 +3245,7 @@ "byteOffset": 33425408 } ], - "md5sum": "8cdb1371166272e1a9084901fc4be2f2" + "md5sum": "64e85992e12b41d931b4135988285364" }, { "dataPath": "params_shard_53.bin", @@ -3264,7 +3264,7 @@ "byteOffset": 0 } ], - "md5sum": "8d9bb581a610c0f8253fb86edb63b3e7" + "md5sum": "c9311d3be9641447bf58117d7e8c58a7" }, { "dataPath": "params_shard_54.bin", @@ -3369,7 +3369,7 @@ "byteOffset": 30896128 } ], - "md5sum": "35b6c52919b02d23fcc4eb6c96fa3939" + "md5sum": "d621aecf6605c376c716c5740763cd54" }, { "dataPath": "params_shard_55.bin", @@ -3388,7 +3388,7 @@ "byteOffset": 0 } ], - "md5sum": "4fdd2e740eb529f99aa42517aff952e1" + "md5sum": "d3b2599308c53564ab04eb7c13b15fad" }, { "dataPath": "params_shard_56.bin", @@ -3493,7 +3493,7 @@ "byteOffset": 30896128 } ], - "md5sum": "34d8e5a154849d6cd0e80c3cbfeb415a" + "md5sum": "efdbce3b0bdac0012a5351dde276b4cc" }, { "dataPath": "params_shard_57.bin", @@ -3512,7 +3512,7 @@ "byteOffset": 0 } ], - "md5sum": "5424057c52fefadd949acaf659270b4f" + "md5sum": "5e4f4154f7e37074b030ef2ba84f99fe" }, { "dataPath": "params_shard_58.bin", @@ -3617,7 +3617,7 @@ "byteOffset": 30896128 } ], - "md5sum": "d9a4476ee91dcd2b8b4e1fc21e62e3ae" + "md5sum": "852443b009f7b915ac3d3b9058bd8473" }, { "dataPath": "params_shard_59.bin", @@ -3636,7 +3636,7 @@ "byteOffset": 0 } ], - "md5sum": "3c7dfad2b08f7f7286e527bb245d0c22" + "md5sum": "e7e25940d67c00c1b8d30e56ea7d5fd4" }, { "dataPath": "params_shard_60.bin", @@ -3741,7 +3741,7 @@ "byteOffset": 30896128 } ], - "md5sum": "021ced36e57a5c9c9c4799aaa95aa1b3" + "md5sum": "94d1dfa1be75385702998e301115055a" }, { "dataPath": "params_shard_61.bin", @@ -3760,7 +3760,7 @@ "byteOffset": 0 } ], - "md5sum": "15b1fe414b809a835331cb0688bd903f" + "md5sum": "4608f00654ceaa9953c3daccb281330b" }, { "dataPath": "params_shard_62.bin", @@ -3865,7 +3865,7 @@ "byteOffset": 30896128 } ], - "md5sum": "7b85b21a4f10e21933aa76f10079d7c6" + "md5sum": "9bd35cc0fed109dedcb6e04ff7d162d2" }, { "dataPath": "params_shard_63.bin", @@ -3884,7 +3884,7 @@ "byteOffset": 0 } ], - "md5sum": "80ffcfa1ab4cb04357f75e1fcd6d2018" + "md5sum": "5f3ccfc709639df0a73db5ee3a960fb7" }, { "dataPath": "params_shard_64.bin", @@ -3989,12 +3989,12 @@ "byteOffset": 30896128 } ], - "md5sum": "1a6d6b9b372685fc903858f709c330d3" + "md5sum": "ad1237b06fbd0528c9f8e23cf79a8891" }, { "dataPath": "params_shard_65.bin", "format": "raw-shard", - "nbytes": 31968980, + "nbytes": 27834368, "records": [ { "name": "model.h.9.mixer.out_proj.q_weight", @@ -4076,26 +4076,15 @@ "byteOffset": 17041408 }, { - "name": "vision_embed_tokens.img_processor.vision_model.embeddings.position_embedding.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.embeddings.position_embedding.weight", "shape": [ 577, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 240032, - "byteOffset": 18245632 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.embeddings.position_embedding.q_scale", - "shape": [ - 577, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 30004, - "byteOffset": 18485664 + "nbytes": 1181696, + "byteOffset": 18245632 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.layer_norm1.bias", @@ -4105,7 +4094,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 18515668 + "byteOffset": 19427328 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.layer_norm1.weight", @@ -4115,7 +4104,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 18517716 + "byteOffset": 19429376 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.layer_norm2.bias", @@ -4125,7 +4114,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 18519764 + "byteOffset": 19431424 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.layer_norm2.weight", @@ -4135,7 +4124,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 18521812 + "byteOffset": 19433472 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.mlp.fc1.bias", @@ -4145,29 +4134,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 18523860 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.mlp.fc1.q_weight", - "shape": [ - 4096, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1703936, - "byteOffset": 18532052 + "byteOffset": 19435520 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.mlp.fc1.weight", "shape": [ 4096, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 212992, - "byteOffset": 20235988 + "nbytes": 8388608, + "byteOffset": 19443712 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.mlp.fc2.bias", @@ -4177,29 +4155,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 20448980 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.mlp.fc2.q_weight", - "shape": [ - 1024, - 412 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1687552, - "byteOffset": 20451028 - }, + "byteOffset": 27832320 + } + ], + "md5sum": "e9f4130276ed5535299d74f5e68e0597" + }, + { + "dataPath": "params_shard_66.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.mlp.fc2.weight", "shape": [ 1024, - 103 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 210944, - "byteOffset": 22138580 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.k_proj.bias", @@ -4209,29 +4184,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 22349524 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 22351572 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.k_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 22777556 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.out_proj.bias", @@ -4241,29 +4205,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 22830804 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 22832852 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.out_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 23258836 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.q_proj.bias", @@ -4273,29 +4226,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 23312084 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 23314132 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.q_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 23740116 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.v_proj.bias", @@ -4305,29 +4247,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 23793364 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 23795412 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.v_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 24221396 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.layer_norm1.bias", @@ -4337,7 +4268,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 24274644 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.layer_norm1.weight", @@ -4347,7 +4278,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 24276692 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.layer_norm2.bias", @@ -4357,7 +4288,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 24278740 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.layer_norm2.weight", @@ -4367,7 +4298,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 24280788 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.mlp.fc1.bias", @@ -4377,29 +4308,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 24282836 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.mlp.fc1.q_weight", - "shape": [ - 4096, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1703936, - "byteOffset": 24291028 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.mlp.fc1.weight", "shape": [ 4096, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 212992, - "byteOffset": 25994964 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.mlp.fc2.bias", @@ -4409,29 +4329,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 26207956 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.mlp.fc2.q_weight", - "shape": [ - 1024, - 412 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1687552, - "byteOffset": 26210004 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "12ccc3786467895471d31bb5b1d2610c" + }, + { + "dataPath": "params_shard_67.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.mlp.fc2.weight", "shape": [ 1024, - 103 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 210944, - "byteOffset": 27897556 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.k_proj.bias", @@ -4441,29 +4358,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 28108500 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 28110548 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.k_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 28536532 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.out_proj.bias", @@ -4473,29 +4379,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 28589780 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 28591828 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.out_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 29017812 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.q_proj.bias", @@ -4505,29 +4400,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 29071060 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 29073108 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.q_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 29499092 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.v_proj.bias", @@ -4537,29 +4421,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 29552340 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 29554388 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.v_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 29980372 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.layer_norm1.bias", @@ -4569,7 +4442,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 30033620 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.layer_norm1.weight", @@ -4579,7 +4452,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 30035668 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.layer_norm2.bias", @@ -4589,7 +4462,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 30037716 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.layer_norm2.weight", @@ -4599,7 +4472,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 30039764 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.mlp.fc1.bias", @@ -4609,29 +4482,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 30041812 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.mlp.fc1.q_weight", - "shape": [ - 4096, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1703936, - "byteOffset": 30050004 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.mlp.fc1.weight", "shape": [ 4096, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 212992, - "byteOffset": 31753940 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.mlp.fc2.bias", @@ -4641,37 +4503,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 31966932 + "byteOffset": 25190400 } ], - "md5sum": "50ec01b6812197d7e6a45c6f47b0dfe5" + "md5sum": "dcc2adf61aa07fe189bb15874110e845" }, { - "dataPath": "params_shard_66.bin", + "dataPath": "params_shard_68.bin", "format": "raw-shard", - "nbytes": 32634880, + "nbytes": 25192448, "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.mlp.fc2.q_weight", - "shape": [ - 1024, - 412 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1687552, - "byteOffset": 0 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.mlp.fc2.weight", "shape": [ 1024, - 103 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 210944, - "byteOffset": 1687552 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.k_proj.bias", @@ -4681,29 +4532,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 1898496 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 1900544 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.k_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 2326528 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.out_proj.bias", @@ -4713,29 +4553,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 2379776 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 2381824 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.out_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 2807808 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.q_proj.bias", @@ -4745,29 +4574,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 2861056 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 2863104 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.q_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 3289088 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.v_proj.bias", @@ -4777,29 +4595,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 3342336 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 3344384 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.v_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 3770368 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.layer_norm1.bias", @@ -4809,7 +4616,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 3823616 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.layer_norm1.weight", @@ -4819,7 +4626,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 3825664 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.layer_norm2.bias", @@ -4829,7 +4636,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 3827712 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.layer_norm2.weight", @@ -4839,7 +4646,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 3829760 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.mlp.fc1.bias", @@ -4849,29 +4656,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 3831808 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.mlp.fc1.q_weight", - "shape": [ - 4096, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1703936, - "byteOffset": 3840000 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.mlp.fc1.weight", "shape": [ 4096, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 212992, - "byteOffset": 5543936 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.mlp.fc2.bias", @@ -4881,29 +4677,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 5756928 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.mlp.fc2.q_weight", - "shape": [ - 1024, - 412 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1687552, - "byteOffset": 5758976 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "9f8d49d8894a05f4179ba707925e9d59" + }, + { + "dataPath": "params_shard_69.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.mlp.fc2.weight", "shape": [ 1024, - 103 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 210944, - "byteOffset": 7446528 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.k_proj.bias", @@ -4913,29 +4706,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 7657472 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 7659520 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.k_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 8085504 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.out_proj.bias", @@ -4945,29 +4727,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 8138752 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 8140800 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.out_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 8566784 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.q_proj.bias", @@ -4977,29 +4748,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 8620032 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 8622080 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.q_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 9048064 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.v_proj.bias", @@ -5009,29 +4769,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 9101312 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 9103360 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.v_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 9529344 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.layer_norm1.bias", @@ -5041,7 +4790,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 9582592 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.layer_norm1.weight", @@ -5051,7 +4800,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 9584640 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.layer_norm2.bias", @@ -5061,7 +4810,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 9586688 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.layer_norm2.weight", @@ -5071,7 +4820,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 9588736 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.mlp.fc1.bias", @@ -5081,29 +4830,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 9590784 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.mlp.fc1.q_weight", - "shape": [ - 4096, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1703936, - "byteOffset": 9598976 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.mlp.fc1.weight", "shape": [ 4096, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 212992, - "byteOffset": 11302912 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.mlp.fc2.bias", @@ -5113,29 +4851,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 11515904 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.mlp.fc2.q_weight", - "shape": [ - 1024, - 412 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1687552, - "byteOffset": 11517952 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "19b6f5d2cfc839108f9156b8b521d3ce" + }, + { + "dataPath": "params_shard_70.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.mlp.fc2.weight", "shape": [ 1024, - 103 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 210944, - "byteOffset": 13205504 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.k_proj.bias", @@ -5145,29 +4880,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 13416448 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 13418496 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.k_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 13844480 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.out_proj.bias", @@ -5177,29 +4901,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 13897728 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 13899776 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.out_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 14325760 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.q_proj.bias", @@ -5209,29 +4922,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 14379008 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 14381056 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.q_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 14807040 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.v_proj.bias", @@ -5241,29 +4943,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 14860288 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 14862336 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.v_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 15288320 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.layer_norm1.bias", @@ -5273,7 +4964,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 15341568 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.layer_norm1.weight", @@ -5283,7 +4974,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 15343616 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.layer_norm2.bias", @@ -5293,7 +4984,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 15345664 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.layer_norm2.weight", @@ -5303,7 +4994,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 15347712 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.mlp.fc1.bias", @@ -5313,29 +5004,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 15349760 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.mlp.fc1.q_weight", - "shape": [ - 4096, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1703936, - "byteOffset": 15357952 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.mlp.fc1.weight", "shape": [ 4096, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 212992, - "byteOffset": 17061888 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.mlp.fc2.bias", @@ -5345,29 +5025,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 17274880 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.mlp.fc2.q_weight", - "shape": [ - 1024, - 412 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1687552, - "byteOffset": 17276928 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "3e6322c0673873144d67964c709fa3be" + }, + { + "dataPath": "params_shard_71.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.mlp.fc2.weight", "shape": [ 1024, - 103 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 210944, - "byteOffset": 18964480 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.k_proj.bias", @@ -5377,29 +5054,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 19175424 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 19177472 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.k_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 19603456 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.out_proj.bias", @@ -5409,29 +5075,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 19656704 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 19658752 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.out_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 20084736 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.q_proj.bias", @@ -5441,29 +5096,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 20137984 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 20140032 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.q_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 20566016 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.v_proj.bias", @@ -5473,29 +5117,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 20619264 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 20621312 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.v_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 21047296 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.layer_norm1.bias", @@ -5505,7 +5138,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 21100544 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.layer_norm1.weight", @@ -5515,7 +5148,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 21102592 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.layer_norm2.bias", @@ -5525,7 +5158,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 21104640 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.layer_norm2.weight", @@ -5535,7 +5168,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 21106688 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.mlp.fc1.bias", @@ -5545,29 +5178,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 21108736 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.mlp.fc1.q_weight", - "shape": [ - 4096, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1703936, - "byteOffset": 21116928 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.mlp.fc1.weight", "shape": [ 4096, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 212992, - "byteOffset": 22820864 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.mlp.fc2.bias", @@ -5577,29 +5199,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 23033856 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.mlp.fc2.q_weight", - "shape": [ - 1024, - 412 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1687552, - "byteOffset": 23035904 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "f04370015a40ae2073f5d89ad86f1c42" + }, + { + "dataPath": "params_shard_72.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.mlp.fc2.weight", "shape": [ 1024, - 103 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 210944, - "byteOffset": 24723456 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.k_proj.bias", @@ -5609,29 +5228,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 24934400 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 24936448 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.k_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 25362432 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.out_proj.bias", @@ -5641,29 +5249,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 25415680 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 25417728 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.out_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 25843712 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.q_proj.bias", @@ -5673,29 +5270,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 25896960 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 25899008 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.q_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 26324992 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.v_proj.bias", @@ -5705,29 +5291,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 26378240 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 26380288 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.v_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 26806272 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.layer_norm1.bias", @@ -5737,7 +5312,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 26859520 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.layer_norm1.weight", @@ -5747,7 +5322,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 26861568 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.layer_norm2.bias", @@ -5757,7 +5332,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 26863616 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.layer_norm2.weight", @@ -5767,7 +5342,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 26865664 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.mlp.fc1.bias", @@ -5777,29 +5352,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 26867712 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.mlp.fc1.q_weight", - "shape": [ - 4096, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1703936, - "byteOffset": 26875904 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.mlp.fc1.weight", "shape": [ 4096, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 212992, - "byteOffset": 28579840 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.mlp.fc2.bias", @@ -5809,29 +5373,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 28792832 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.mlp.fc2.q_weight", - "shape": [ - 1024, - 412 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1687552, - "byteOffset": 28794880 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "e2c99d455ee851ede30d282481166453" + }, + { + "dataPath": "params_shard_73.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.mlp.fc2.weight", "shape": [ 1024, - 103 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 210944, - "byteOffset": 30482432 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.k_proj.bias", @@ -5841,29 +5402,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 30693376 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 30695424 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.k_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 31121408 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.out_proj.bias", @@ -5873,29 +5423,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 31174656 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 31176704 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.out_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 31602688 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.q_proj.bias", @@ -5905,29 +5444,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 31655936 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 31657984 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.q_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 32083968 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.v_proj.bias", @@ -5937,29 +5465,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 32137216 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 32139264 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.v_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 32565248 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.layer_norm1.bias", @@ -5969,7 +5486,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 32618496 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.layer_norm1.weight", @@ -5979,7 +5496,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 32620544 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.layer_norm2.bias", @@ -5989,7 +5506,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 32622592 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.layer_norm2.weight", @@ -5999,7 +5516,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 32624640 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.mlp.fc1.bias", @@ -6009,37 +5526,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 32626688 - } - ], - "md5sum": "81c15ab7a906dcc39b7bf83864d4b44f" - }, - { - "dataPath": "params_shard_67.bin", - "format": "raw-shard", - "nbytes": 33521664, - "records": [ - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.mlp.fc1.q_weight", - "shape": [ - 4096, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1703936, - "byteOffset": 0 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.mlp.fc1.weight", "shape": [ 4096, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 212992, - "byteOffset": 1703936 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.mlp.fc2.bias", @@ -6049,29 +5547,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 1916928 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.mlp.fc2.q_weight", - "shape": [ - 1024, - 412 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1687552, - "byteOffset": 1918976 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "11c75f74757caccc61b9f6c3f39a9737" + }, + { + "dataPath": "params_shard_74.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.mlp.fc2.weight", "shape": [ 1024, - 103 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 210944, - "byteOffset": 3606528 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.k_proj.bias", @@ -6081,61 +5576,39 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 3817472 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.k_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.k_proj.weight", "shape": [ 1024, - 104 + 1024 ], - "dtype": "uint32", + "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 3819520 + "nbytes": 2097152, + "byteOffset": 8390656 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.k_proj.q_scale", - "shape": [ - 1024, - 26 - ], - "dtype": "float16", - "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 4245504 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.out_proj.bias", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.out_proj.bias", "shape": [ 1024 ], "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 4298752 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 4300800 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.out_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 4726784 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.q_proj.bias", @@ -6145,29 +5618,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 4780032 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.q_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.q_proj.weight", "shape": [ 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 4782080 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.q_proj.q_scale", - "shape": [ - 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 5208064 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.v_proj.bias", @@ -6177,29 +5639,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 5261312 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.v_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.v_proj.weight", "shape": [ 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 5263360 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.v_proj.q_scale", - "shape": [ - 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 5689344 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.layer_norm1.bias", @@ -6209,7 +5660,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 5742592 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.layer_norm1.weight", @@ -6219,7 +5670,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 5744640 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.layer_norm2.bias", @@ -6229,7 +5680,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 5746688 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.layer_norm2.weight", @@ -6239,7 +5690,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 5748736 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.mlp.fc1.bias", @@ -6249,29 +5700,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 5750784 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.mlp.fc1.q_weight", - "shape": [ - 4096, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1703936, - "byteOffset": 5758976 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.mlp.fc1.weight", "shape": [ 4096, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 212992, - "byteOffset": 7462912 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.mlp.fc2.bias", @@ -6281,29 +5721,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 7675904 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.mlp.fc2.q_weight", - "shape": [ - 1024, - 412 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1687552, - "byteOffset": 7677952 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "a7f57fd25793b85aa6027a514efc39fb" + }, + { + "dataPath": "params_shard_75.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.mlp.fc2.weight", "shape": [ 1024, - 103 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 210944, - "byteOffset": 9365504 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.k_proj.bias", @@ -6313,29 +5750,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 9576448 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 9578496 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.k_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 10004480 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.out_proj.bias", @@ -6345,29 +5771,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 10057728 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.out_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.out_proj.weight", "shape": [ 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 10059776 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.out_proj.q_scale", - "shape": [ - 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 10485760 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.q_proj.bias", @@ -6377,29 +5792,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 10539008 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.q_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.q_proj.weight", "shape": [ 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 10541056 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.q_proj.q_scale", - "shape": [ - 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 10967040 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.v_proj.bias", @@ -6409,29 +5813,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 11020288 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.v_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.v_proj.weight", "shape": [ 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 11022336 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.v_proj.q_scale", - "shape": [ - 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 11448320 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.layer_norm1.bias", @@ -6441,7 +5834,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 11501568 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.layer_norm1.weight", @@ -6451,7 +5844,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 11503616 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.layer_norm2.bias", @@ -6461,7 +5854,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 11505664 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.layer_norm2.weight", @@ -6471,7 +5864,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 11507712 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.mlp.fc1.bias", @@ -6481,29 +5874,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 11509760 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.mlp.fc1.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.mlp.fc1.weight", "shape": [ 4096, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1703936, - "byteOffset": 11517952 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.mlp.fc1.q_scale", - "shape": [ - 4096, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 212992, - "byteOffset": 13221888 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.mlp.fc2.bias", @@ -6513,29 +5895,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 13434880 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.mlp.fc2.q_weight", - "shape": [ - 1024, - 412 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1687552, - "byteOffset": 13436928 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "e13228942bc433e638fe3903001715f3" + }, + { + "dataPath": "params_shard_76.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.mlp.fc2.weight", "shape": [ 1024, - 103 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 210944, - "byteOffset": 15124480 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.k_proj.bias", @@ -6545,29 +5924,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 15335424 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.k_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.k_proj.weight", "shape": [ 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 15337472 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.k_proj.q_scale", - "shape": [ - 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 15763456 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.out_proj.bias", @@ -6577,29 +5945,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 15816704 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.out_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.out_proj.weight", "shape": [ 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 15818752 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.out_proj.q_scale", - "shape": [ - 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 16244736 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.q_proj.bias", @@ -6609,29 +5966,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 16297984 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.q_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.q_proj.weight", "shape": [ 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 16300032 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.q_proj.q_scale", - "shape": [ - 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 16726016 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.v_proj.bias", @@ -6641,29 +5987,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 16779264 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.v_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.v_proj.weight", "shape": [ 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 16781312 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.v_proj.q_scale", - "shape": [ - 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 17207296 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.layer_norm1.bias", @@ -6673,7 +6008,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 17260544 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.layer_norm1.weight", @@ -6683,7 +6018,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 17262592 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.layer_norm2.bias", @@ -6693,7 +6028,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 17264640 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.layer_norm2.weight", @@ -6703,7 +6038,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 17266688 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.mlp.fc1.bias", @@ -6713,29 +6048,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 17268736 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.mlp.fc1.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.mlp.fc1.weight", "shape": [ 4096, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1703936, - "byteOffset": 17276928 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.mlp.fc1.q_scale", - "shape": [ - 4096, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 212992, - "byteOffset": 18980864 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.mlp.fc2.bias", @@ -6745,29 +6069,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 19193856 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.mlp.fc2.q_weight", - "shape": [ - 1024, - 412 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1687552, - "byteOffset": 19195904 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "eab0a6fc1a1e3beac991a0be01fdefe8" + }, + { + "dataPath": "params_shard_77.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.mlp.fc2.weight", "shape": [ 1024, - 103 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 210944, - "byteOffset": 20883456 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.k_proj.bias", @@ -6777,29 +6098,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 21094400 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 21096448 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.k_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 21522432 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.out_proj.bias", @@ -6809,29 +6119,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 21575680 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.out_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.out_proj.weight", "shape": [ 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 21577728 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.out_proj.q_scale", - "shape": [ - 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 22003712 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.q_proj.bias", @@ -6841,29 +6140,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 22056960 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.q_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.q_proj.weight", "shape": [ 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 22059008 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.q_proj.q_scale", - "shape": [ - 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 22484992 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.v_proj.bias", @@ -6873,29 +6161,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 22538240 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 22540288 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.v_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 22966272 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.layer_norm1.bias", @@ -6905,7 +6182,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 23019520 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.layer_norm1.weight", @@ -6915,7 +6192,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 23021568 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.layer_norm2.bias", @@ -6925,7 +6202,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 23023616 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.layer_norm2.weight", @@ -6935,7 +6212,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 23025664 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.mlp.fc1.bias", @@ -6945,29 +6222,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 23027712 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.mlp.fc1.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.mlp.fc1.weight", "shape": [ 4096, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1703936, - "byteOffset": 23035904 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.mlp.fc1.q_scale", - "shape": [ - 4096, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 212992, - "byteOffset": 24739840 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.mlp.fc2.bias", @@ -6977,29 +6243,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 24952832 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.mlp.fc2.q_weight", - "shape": [ - 1024, - 412 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1687552, - "byteOffset": 24954880 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "afcfd0263f305fcc63e7b86393753bf7" + }, + { + "dataPath": "params_shard_78.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.mlp.fc2.weight", "shape": [ 1024, - 103 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 210944, - "byteOffset": 26642432 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.k_proj.bias", @@ -7009,29 +6272,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 26853376 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.k_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.k_proj.weight", "shape": [ 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 26855424 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.k_proj.q_scale", - "shape": [ - 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 27281408 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.out_proj.bias", @@ -7041,29 +6293,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 27334656 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.out_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.out_proj.weight", "shape": [ 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 27336704 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.out_proj.q_scale", - "shape": [ - 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 27762688 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.q_proj.bias", @@ -7073,29 +6314,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 27815936 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 27817984 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.q_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 28243968 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.v_proj.bias", @@ -7105,29 +6335,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 28297216 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.v_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.v_proj.weight", "shape": [ 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 28299264 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.v_proj.q_scale", - "shape": [ - 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 28725248 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.layer_norm1.bias", @@ -7137,7 +6356,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 28778496 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.layer_norm1.weight", @@ -7147,7 +6366,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 28780544 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.layer_norm2.bias", @@ -7157,7 +6376,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 28782592 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.layer_norm2.weight", @@ -7167,7 +6386,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 28784640 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.mlp.fc1.bias", @@ -7177,29 +6396,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 28786688 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.mlp.fc1.q_weight", - "shape": [ - 4096, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1703936, - "byteOffset": 28794880 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.mlp.fc1.weight", "shape": [ 4096, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 212992, - "byteOffset": 30498816 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.mlp.fc2.bias", @@ -7209,29 +6417,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 30711808 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.mlp.fc2.q_weight", - "shape": [ - 1024, - 412 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1687552, - "byteOffset": 30713856 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "460a8bc76edf812f85886ec9f950f395" + }, + { + "dataPath": "params_shard_79.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.mlp.fc2.weight", "shape": [ 1024, - 103 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 210944, - "byteOffset": 32401408 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.k_proj.bias", @@ -7241,29 +6446,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 32612352 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.k_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.k_proj.weight", "shape": [ 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 32614400 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.k_proj.q_scale", - "shape": [ - 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 33040384 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.out_proj.bias", @@ -7273,37 +6467,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 33093632 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.out_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.out_proj.weight", "shape": [ 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 33095680 - } - ], - "md5sum": "c24f2e57d8e79878e359cf6ab34d1bee" - }, - { - "dataPath": "params_shard_68.bin", - "format": "raw-shard", - "nbytes": 33433600, - "records": [ - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.out_proj.q_scale", - "shape": [ - 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 0 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.q_proj.bias", @@ -7313,29 +6488,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 53248 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 55296 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.q_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 481280 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.v_proj.bias", @@ -7345,29 +6509,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 534528 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.v_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.v_proj.weight", "shape": [ 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 536576 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.v_proj.q_scale", - "shape": [ - 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 962560 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.layer_norm1.bias", @@ -7377,7 +6530,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 1015808 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.layer_norm1.weight", @@ -7387,7 +6540,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 1017856 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.layer_norm2.bias", @@ -7397,7 +6550,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 1019904 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.layer_norm2.weight", @@ -7407,7 +6560,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 1021952 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.mlp.fc1.bias", @@ -7417,29 +6570,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 1024000 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.mlp.fc1.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.mlp.fc1.weight", "shape": [ 4096, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1703936, - "byteOffset": 1032192 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.mlp.fc1.q_scale", - "shape": [ - 4096, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 212992, - "byteOffset": 2736128 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.mlp.fc2.bias", @@ -7449,29 +6591,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 2949120 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.mlp.fc2.q_weight", - "shape": [ - 1024, - 412 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1687552, - "byteOffset": 2951168 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "bcac984764bba0a4eb9891d2043e1d89" + }, + { + "dataPath": "params_shard_80.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.mlp.fc2.weight", "shape": [ 1024, - 103 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 210944, - "byteOffset": 4638720 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.k_proj.bias", @@ -7481,29 +6620,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 4849664 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.k_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.k_proj.weight", "shape": [ 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 4851712 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.k_proj.q_scale", - "shape": [ - 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 5277696 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.out_proj.bias", @@ -7513,29 +6641,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 5330944 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.out_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.out_proj.weight", "shape": [ 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 5332992 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.out_proj.q_scale", - "shape": [ - 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 5758976 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.q_proj.bias", @@ -7545,29 +6662,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 5812224 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 5814272 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.q_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 6240256 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.v_proj.bias", @@ -7577,29 +6683,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 6293504 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 6295552 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.v_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 6721536 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.layer_norm1.bias", @@ -7609,7 +6704,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 6774784 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.layer_norm1.weight", @@ -7619,7 +6714,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 6776832 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.layer_norm2.bias", @@ -7629,7 +6724,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 6778880 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.layer_norm2.weight", @@ -7639,7 +6734,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 6780928 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.mlp.fc1.bias", @@ -7649,29 +6744,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 6782976 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.mlp.fc1.q_weight", - "shape": [ - 4096, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1703936, - "byteOffset": 6791168 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.mlp.fc1.weight", "shape": [ 4096, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 212992, - "byteOffset": 8495104 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.mlp.fc2.bias", @@ -7681,29 +6765,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 8708096 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.mlp.fc2.q_weight", - "shape": [ - 1024, - 412 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1687552, - "byteOffset": 8710144 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "3197e582d745d84c2ab4347a1f2d4e2d" + }, + { + "dataPath": "params_shard_81.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.mlp.fc2.weight", "shape": [ 1024, - 103 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 210944, - "byteOffset": 10397696 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.k_proj.bias", @@ -7713,29 +6794,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 10608640 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 10610688 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.k_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 11036672 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.out_proj.bias", @@ -7745,29 +6815,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 11089920 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 11091968 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.out_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 11517952 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.q_proj.bias", @@ -7777,29 +6836,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 11571200 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 11573248 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.q_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 11999232 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.v_proj.bias", @@ -7809,29 +6857,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 12052480 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 12054528 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.v_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 12480512 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.layer_norm1.bias", @@ -7841,7 +6878,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 12533760 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.layer_norm1.weight", @@ -7851,7 +6888,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 12535808 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.layer_norm2.bias", @@ -7861,7 +6898,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 12537856 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.layer_norm2.weight", @@ -7871,7 +6908,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 12539904 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.mlp.fc1.bias", @@ -7881,29 +6918,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 12541952 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.mlp.fc1.q_weight", - "shape": [ - 4096, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1703936, - "byteOffset": 12550144 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.mlp.fc1.weight", "shape": [ 4096, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 212992, - "byteOffset": 14254080 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.mlp.fc2.bias", @@ -7913,29 +6939,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 14467072 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.mlp.fc2.q_weight", - "shape": [ - 1024, - 412 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1687552, - "byteOffset": 14469120 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "e6d67ae9f4dab5ea49fac79bceac7a86" + }, + { + "dataPath": "params_shard_82.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.mlp.fc2.weight", "shape": [ 1024, - 103 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 210944, - "byteOffset": 16156672 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.k_proj.bias", @@ -7945,29 +6968,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 16367616 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 16369664 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.k_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 16795648 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.out_proj.bias", @@ -7977,29 +6989,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 16848896 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 16850944 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.out_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 17276928 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.q_proj.bias", @@ -8009,29 +7010,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 17330176 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 17332224 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.q_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 17758208 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.v_proj.bias", @@ -8041,29 +7031,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 17811456 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 17813504 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.v_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 18239488 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.layer_norm1.bias", @@ -8073,7 +7052,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 18292736 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.layer_norm1.weight", @@ -8083,7 +7062,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 18294784 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.layer_norm2.bias", @@ -8093,7 +7072,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 18296832 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.layer_norm2.weight", @@ -8103,7 +7082,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 18298880 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.mlp.fc1.bias", @@ -8113,29 +7092,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 18300928 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.mlp.fc1.q_weight", - "shape": [ - 4096, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1703936, - "byteOffset": 18309120 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.mlp.fc1.weight", "shape": [ 4096, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 212992, - "byteOffset": 20013056 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.mlp.fc2.bias", @@ -8145,29 +7113,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 20226048 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.mlp.fc2.q_weight", - "shape": [ - 1024, - 412 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1687552, - "byteOffset": 20228096 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "1a74510bf14d6fc06b53f09ee6a22fdd" + }, + { + "dataPath": "params_shard_83.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.mlp.fc2.weight", "shape": [ 1024, - 103 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 210944, - "byteOffset": 21915648 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.k_proj.bias", @@ -8177,29 +7142,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 22126592 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 22128640 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.k_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 22554624 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.out_proj.bias", @@ -8209,29 +7163,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 22607872 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 22609920 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.out_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 23035904 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.q_proj.bias", @@ -8241,29 +7184,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 23089152 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 23091200 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.q_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 23517184 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.v_proj.bias", @@ -8273,29 +7205,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 23570432 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 23572480 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.v_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 23998464 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.layer_norm1.bias", @@ -8305,7 +7226,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 24051712 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.layer_norm1.weight", @@ -8315,7 +7236,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 24053760 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.layer_norm2.bias", @@ -8325,7 +7246,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 24055808 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.layer_norm2.weight", @@ -8335,7 +7256,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 24057856 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.mlp.fc1.bias", @@ -8345,29 +7266,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 24059904 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.mlp.fc1.q_weight", - "shape": [ - 4096, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1703936, - "byteOffset": 24068096 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.mlp.fc1.weight", "shape": [ 4096, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 212992, - "byteOffset": 25772032 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.mlp.fc2.bias", @@ -8377,29 +7287,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 25985024 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.mlp.fc2.q_weight", - "shape": [ - 1024, - 412 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1687552, - "byteOffset": 25987072 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "75a9ee23e852e5562e2176a5ece04f24" + }, + { + "dataPath": "params_shard_84.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.mlp.fc2.weight", "shape": [ 1024, - 103 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 210944, - "byteOffset": 27674624 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.k_proj.bias", @@ -8409,29 +7316,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 27885568 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 27887616 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.k_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 28313600 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.out_proj.bias", @@ -8441,29 +7337,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 28366848 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 28368896 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.out_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 28794880 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.q_proj.bias", @@ -8473,29 +7358,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 28848128 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 28850176 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.q_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 29276160 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.v_proj.bias", @@ -8505,29 +7379,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 29329408 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 29331456 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.v_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 29757440 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.layer_norm1.bias", @@ -8537,7 +7400,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 29810688 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.layer_norm1.weight", @@ -8547,7 +7410,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 29812736 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.layer_norm2.bias", @@ -8557,7 +7420,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 29814784 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.layer_norm2.weight", @@ -8567,7 +7430,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 29816832 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.mlp.fc1.bias", @@ -8577,29 +7440,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 29818880 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.mlp.fc1.q_weight", - "shape": [ - 4096, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1703936, - "byteOffset": 29827072 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.mlp.fc1.weight", "shape": [ 4096, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 212992, - "byteOffset": 31531008 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.mlp.fc2.bias", @@ -8609,36 +7461,25 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 31744000 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.mlp.fc2.q_weight", - "shape": [ - 1024, - 412 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1687552, - "byteOffset": 31746048 + "byteOffset": 25190400 } ], - "md5sum": "a2dadce37a87f77e5bc03f6942019c7b" + "md5sum": "da3f4d64dad38aa57a47fd6fbca1a334" }, { - "dataPath": "params_shard_69.bin", + "dataPath": "params_shard_85.bin", "format": "raw-shard", - "nbytes": 30887936, + "nbytes": 25192448, "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.mlp.fc2.weight", "shape": [ 1024, - 103 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 210944, + "nbytes": 8388608, "byteOffset": 0 }, { @@ -8649,29 +7490,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 210944 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.k_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.k_proj.weight", "shape": [ 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 212992 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.k_proj.q_scale", - "shape": [ - 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 638976 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.out_proj.bias", @@ -8681,61 +7511,39 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 692224 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.out_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.out_proj.weight", "shape": [ 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 694272 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.out_proj.q_scale", - "shape": [ - 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 1120256 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.q_proj.bias", "shape": [ 1024 ], - "dtype": "float16", - "format": "f32-to-bf16", - "nbytes": 2048, - "byteOffset": 1173504 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", + "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 1175552 + "nbytes": 2048, + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.q_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 1601536 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.v_proj.bias", @@ -8745,29 +7553,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 1654784 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 1656832 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.v_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 2082816 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.layer_norm1.bias", @@ -8777,7 +7574,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 2136064 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.layer_norm1.weight", @@ -8787,7 +7584,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 2138112 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.layer_norm2.bias", @@ -8797,7 +7594,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 2140160 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.layer_norm2.weight", @@ -8807,7 +7604,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 2142208 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.mlp.fc1.bias", @@ -8817,29 +7614,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 2144256 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.mlp.fc1.q_weight", - "shape": [ - 4096, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1703936, - "byteOffset": 2152448 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.mlp.fc1.weight", "shape": [ 4096, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 212992, - "byteOffset": 3856384 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.mlp.fc2.bias", @@ -8849,29 +7635,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 4069376 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.mlp.fc2.q_weight", - "shape": [ - 1024, - 412 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1687552, - "byteOffset": 4071424 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "ca1eb7481171d37cc9fab4b3432d81d1" + }, + { + "dataPath": "params_shard_86.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.mlp.fc2.weight", "shape": [ 1024, - 103 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 210944, - "byteOffset": 5758976 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.k_proj.bias", @@ -8881,29 +7664,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 5969920 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 5971968 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.k_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 6397952 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.out_proj.bias", @@ -8913,29 +7685,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 6451200 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 6453248 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.out_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 6879232 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.q_proj.bias", @@ -8945,29 +7706,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 6932480 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 6934528 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.q_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 7360512 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.v_proj.bias", @@ -8977,29 +7727,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 7413760 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 7415808 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.v_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 7841792 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.layer_norm1.bias", @@ -9009,7 +7748,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 7895040 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.layer_norm1.weight", @@ -9019,7 +7758,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 7897088 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.layer_norm2.bias", @@ -9029,7 +7768,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 7899136 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.layer_norm2.weight", @@ -9039,7 +7778,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 7901184 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.mlp.fc1.bias", @@ -9049,29 +7788,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 7903232 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.mlp.fc1.q_weight", - "shape": [ - 4096, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1703936, - "byteOffset": 7911424 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.mlp.fc1.weight", "shape": [ 4096, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 212992, - "byteOffset": 9615360 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.mlp.fc2.bias", @@ -9081,29 +7809,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 9828352 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.mlp.fc2.q_weight", - "shape": [ - 1024, - 412 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1687552, - "byteOffset": 9830400 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "03be4317a6855a15625866d5dde56763" + }, + { + "dataPath": "params_shard_87.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.mlp.fc2.weight", "shape": [ 1024, - 103 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 210944, - "byteOffset": 11517952 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.k_proj.bias", @@ -9113,29 +7838,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 11728896 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.k_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.k_proj.weight", "shape": [ 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 11730944 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.k_proj.q_scale", - "shape": [ - 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 12156928 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.out_proj.bias", @@ -9145,29 +7859,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 12210176 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.out_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.out_proj.weight", "shape": [ 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 12212224 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.out_proj.q_scale", - "shape": [ - 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 12638208 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.q_proj.bias", @@ -9177,29 +7880,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 12691456 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.q_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.q_proj.weight", "shape": [ 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 12693504 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.q_proj.q_scale", - "shape": [ - 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 13119488 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.v_proj.bias", @@ -9209,29 +7901,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 13172736 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.v_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.v_proj.weight", "shape": [ 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 13174784 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.v_proj.q_scale", - "shape": [ - 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 13600768 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.layer_norm1.bias", @@ -9241,7 +7922,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 13654016 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.layer_norm1.weight", @@ -9251,7 +7932,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 13656064 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.layer_norm2.bias", @@ -9261,7 +7942,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 13658112 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.layer_norm2.weight", @@ -9271,7 +7952,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 13660160 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.mlp.fc1.bias", @@ -9281,29 +7962,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 13662208 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.mlp.fc1.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.mlp.fc1.weight", "shape": [ 4096, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1703936, - "byteOffset": 13670400 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.mlp.fc1.q_scale", - "shape": [ - 4096, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 212992, - "byteOffset": 15374336 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.mlp.fc2.bias", @@ -9313,29 +7983,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 15587328 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.mlp.fc2.q_weight", - "shape": [ - 1024, - 412 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1687552, - "byteOffset": 15589376 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "7464cccd529310def6e3920c637ad62c" + }, + { + "dataPath": "params_shard_88.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.mlp.fc2.weight", "shape": [ 1024, - 103 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 210944, - "byteOffset": 17276928 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.k_proj.bias", @@ -9345,29 +8012,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 17487872 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 17489920 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.k_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 17915904 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.out_proj.bias", @@ -9377,29 +8033,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 17969152 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 17971200 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.out_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 18397184 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.q_proj.bias", @@ -9409,29 +8054,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 18450432 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 18452480 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.q_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 18878464 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.v_proj.bias", @@ -9441,29 +8075,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 18931712 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 18933760 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.v_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 19359744 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.layer_norm1.bias", @@ -9473,7 +8096,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 19412992 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.layer_norm1.weight", @@ -9483,7 +8106,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 19415040 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.layer_norm2.bias", @@ -9493,7 +8116,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 19417088 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.layer_norm2.weight", @@ -9503,7 +8126,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 19419136 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.mlp.fc1.bias", @@ -9513,29 +8136,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 19421184 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.mlp.fc1.q_weight", - "shape": [ - 4096, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1703936, - "byteOffset": 19429376 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.mlp.fc1.weight", "shape": [ 4096, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 212992, - "byteOffset": 21133312 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.mlp.fc2.bias", @@ -9545,29 +8157,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 21346304 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.mlp.fc2.q_weight", - "shape": [ - 1024, - 412 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 1687552, - "byteOffset": 21348352 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "8be48481c922751c9b723a99e5dcd727" + }, + { + "dataPath": "params_shard_89.bin", + "format": "raw-shard", + "nbytes": 26767360, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.mlp.fc2.weight", "shape": [ 1024, - 103 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 210944, - "byteOffset": 23035904 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.k_proj.bias", @@ -9577,29 +8186,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 23246848 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 23248896 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.k_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 23674880 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.out_proj.bias", @@ -9609,29 +8207,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 23728128 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 23730176 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.out_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 24156160 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.q_proj.bias", @@ -9641,29 +8228,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 24209408 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 24211456 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.q_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 24637440 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.v_proj.bias", @@ -9673,29 +8249,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 24690688 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 104 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 425984, - "byteOffset": 24692736 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.v_proj.weight", "shape": [ 1024, - 26 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 53248, - "byteOffset": 25118720 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.post_layernorm.bias", @@ -9705,7 +8270,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 25171968 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.post_layernorm.weight", @@ -9715,7 +8280,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 25174016 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.pre_layrnorm.bias", @@ -9725,7 +8290,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 25176064 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.pre_layrnorm.weight", @@ -9735,7 +8300,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 25178112 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_projection.linear_1.bias", @@ -9745,7 +8310,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 6144, - "byteOffset": 25180160 + "byteOffset": 16793600 }, { "name": "vision_embed_tokens.img_projection.linear_1.q_weight", @@ -9756,7 +8321,7 @@ "dtype": "uint32", "format": "f32-to-bf16", "nbytes": 5062656, - "byteOffset": 25186304 + "byteOffset": 16799744 }, { "name": "vision_embed_tokens.img_projection.linear_1.q_scale", @@ -9767,7 +8332,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 632832, - "byteOffset": 30248960 + "byteOffset": 21862400 }, { "name": "vision_embed_tokens.img_projection.linear_2.bias", @@ -9777,16 +8342,8 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 6144, - "byteOffset": 30881792 - } - ], - "md5sum": "96daef3567f9842251bb425924ac75a3" - }, - { - "dataPath": "params_shard_70.bin", - "format": "raw-shard", - "nbytes": 4265984, - "records": [ + "byteOffset": 22495232 + }, { "name": "vision_embed_tokens.img_projection.linear_2.q_weight", "shape": [ @@ -9796,7 +8353,7 @@ "dtype": "uint32", "format": "f32-to-bf16", "nbytes": 3784704, - "byteOffset": 0 + "byteOffset": 22501376 }, { "name": "vision_embed_tokens.img_projection.linear_2.q_scale", @@ -9807,7 +8364,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 473088, - "byteOffset": 3784704 + "byteOffset": 26286080 }, { "name": "vision_embed_tokens.sub_GN", @@ -9820,10 +8377,10 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 4257792 + "byteOffset": 26759168 } ], - "md5sum": "ebe2947681e943d49c3e4fa08218992a" + "md5sum": "91fb7eb9ed733756ed0c89a04c1a2657" } ] } \ No newline at end of file diff --git a/params_shard_0.bin b/params_shard_0.bin index 4025cd19f474d8ca26dac8b4b67dc02eccaa945e..4db95ad13b46f9a19349eac42574b7a188f760e7 100644 --- a/params_shard_0.bin +++ b/params_shard_0.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f579d855dd806bf4b8a6fb927128443c6557f1d513cc34331aef4b9f0934bd1f +oid sha256:5b945da96e333c0d0b1044c498f977ec149fac30c96adf00a22475cb465acc75 size 39502848 diff --git a/params_shard_1.bin b/params_shard_1.bin index 80f6ca345bac3c1a682cb13c228816e8df1abf83..eacce3d2d693c4c9466910ba883a65e0f166a8a6 100644 --- a/params_shard_1.bin +++ b/params_shard_1.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b66d46f5ad15f3cec6c435c516d5bd45b2ea46a47958b285256a248d600e4012 +oid sha256:250140da2d37c612f22aa1323269dd02d0938ee55e4424d969d64db03fbbce04 size 20185088 diff --git a/params_shard_10.bin b/params_shard_10.bin index 50201563766a2c2d81bcc9d07e7c42d7c10da2c2..3efb385e66657f4ecf14a2654c4cce3e7b1075e2 100644 --- a/params_shard_10.bin +++ b/params_shard_10.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:15701f63d0de813f64fe7ca4e3bc5e538eda66169e22927ffe6ad1cc4902e895 +oid sha256:ba1bfc1dfb79349b1c6a6ac43624ded945e8f5b45981019d5bbd4e13a4dd9e46 size 20185088 diff --git a/params_shard_11.bin b/params_shard_11.bin index 33a0ce55f38cb1702f7bbf50a728855d5a3ca9a9..2b7950b9cf14cd4c6dcfed2930b2c396919c9d1b 100644 --- a/params_shard_11.bin +++ b/params_shard_11.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:225db11275da6d235388a05060d7ce7f01155b4a6bda08aa815b936d5fc17b60 +oid sha256:1e6c95c86d9e8dc513039bf5687aec3e343ea0b4bdd1772e40918a998147d5f9 size 30902272 diff --git a/params_shard_12.bin b/params_shard_12.bin index b5b197fed1c26b94894647107f858949961342c7..0db504e993d85af173b355c592a3ed69a6a0c8ae 100644 --- a/params_shard_12.bin +++ b/params_shard_12.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:62302cfdecf5403d791ff0996b6e7be86000b597d5795e0bc97e62794763f75d +oid sha256:0918d49b599d6952008757b1b7d56a323722327adfef5158178f225317ed975e size 20185088 diff --git a/params_shard_13.bin b/params_shard_13.bin index 4f7100fdeda0fdf0b3106228e747585a1a8df254..4bfd867154a18b967cd9b1be7db8d57378b50f0a 100644 --- a/params_shard_13.bin +++ b/params_shard_13.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7d6ad505b5a4fde8d85ea64eb20a98d3afb1e61b811cb6ea9ab3713a77343c9f +oid sha256:fc8667809b73869528a882dc58e30aa71cad08bf51f11630b1fe04c9c989415c size 30902272 diff --git a/params_shard_14.bin b/params_shard_14.bin index a0e362f8c7829688df34924292096d23eaf13ec3..ddb0fd4d2af4a36cbc0dfa93781a6c96c007e00c 100644 --- a/params_shard_14.bin +++ b/params_shard_14.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:82a2889da1f5f199911932cd991407bfc85dcd425468bedd47f366752a4184bc +oid sha256:b4d73f3869400b506d24b2336bee777f2591198dc89beee24824e07bf62dcf0b size 20185088 diff --git a/params_shard_15.bin b/params_shard_15.bin index bde9dbe1976d98a532e83bffb7028444c02a9d47..f19c7bd8c3e0c8dc1bf7c48c162f80786eaba3b4 100644 --- a/params_shard_15.bin +++ b/params_shard_15.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6e1205031513c2a6bdc92856eaca3107259e8b0b1222ea8b0145483cbf247660 +oid sha256:0166f4aa2dcf5da7a10c45806e0ed2d26a829b849230b85775b502298cfa5c18 size 30902272 diff --git a/params_shard_16.bin b/params_shard_16.bin index b2a937a2905ba94a9dba0e56988f60623e4c18b7..82ae72c399dcf4f609dc0bd30dfd179bc945a26f 100644 --- a/params_shard_16.bin +++ b/params_shard_16.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:28a458fc24635a9ec856edeb447002d0fb45a3f69ca5899218e9654c9b7df54a +oid sha256:dc0ba170d872a37060cc7900f9da0f59d8655d17cbd976ec731843cc89b3c2c1 size 20185088 diff --git a/params_shard_17.bin b/params_shard_17.bin index a88708ed627ea8780ad8f5e0d2ce54ca5faebfa4..1cdfcd0c213264d9695a6d9a05ba8f95210cab40 100644 --- a/params_shard_17.bin +++ b/params_shard_17.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:85ea113c5184f7306bf8394f35bcf8f34b9982e1ed3447af0f26e21307f7a71c +oid sha256:071bc32bc5e77580050866332ca62b5c5dbb5a4ccdf173a2a224414f238b0fdf size 30902272 diff --git a/params_shard_18.bin b/params_shard_18.bin index 457004e0a9967742c928f13a42f6bf1c019a191b..add98743fee5c3d0a5cdca487c342516de2dfbae 100644 --- a/params_shard_18.bin +++ b/params_shard_18.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2b26dcf626362025760a311973c990d557f9cd5efc5f19b9985939f9deb13d8c +oid sha256:66820a3ebeee1f4bd090c0fd4489024564d0584bce045cf5c75a977b0ff52fc2 size 20185088 diff --git a/params_shard_19.bin b/params_shard_19.bin index feb94f130d1ccbdb574e4be1052308db3350b2d0..25415892dbe7c5692ff2b7259487a23816fa9aca 100644 --- a/params_shard_19.bin +++ b/params_shard_19.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1d02100ccb08d4e257bf2f7b95c052032c4d3be787e0621af78c7ece611b90db +oid sha256:f9fc9e86e7774965dd6046f177d7173c1b63d45a136ca44afd99e2faea7f2c96 size 30902272 diff --git a/params_shard_2.bin b/params_shard_2.bin index 5ea6e242d60201f3eee16588d6b0e83e65fd53f3..8f5fab3369861446870fa97f2d5715e567e9a80f 100644 --- a/params_shard_2.bin +++ b/params_shard_2.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:13862d8f0ed8f0cd41cadce7e2c504957e9f19328ebd76d71f753cd5b09c7fbe +oid sha256:69e09fe9b54a99bfffda5893635344401d3644950a6074270d0c295349fcc904 size 31588480 diff --git a/params_shard_20.bin b/params_shard_20.bin index 65b0186ea34ef9dd1dc79af9e2cb7a0990743503..8e98850823cea14c84c81ea3f3204a3bdb5baf50 100644 --- a/params_shard_20.bin +++ b/params_shard_20.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:03a3b6080a190abbb340a49a3381e34534f554178e785a2001da91f810bf1a99 +oid sha256:33145fb5e49e431d7f2c98b687d2d8d5a568aaba6bae09d6ad599662fb740d35 size 20185088 diff --git a/params_shard_21.bin b/params_shard_21.bin index ba846131927e75c3038e0584a76207cce9bdc5e6..4af7a822b0bf2c30638b63e2c30ffa41dbeb3473 100644 --- a/params_shard_21.bin +++ b/params_shard_21.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:abcdfc7fa756af576fbcbd87f2063656cf657793af721cd22ace8e4733689172 +oid sha256:9d52461369d6716bb044a06ce2203c962032e735b3056c598f78b3778906edc7 size 30902272 diff --git a/params_shard_22.bin b/params_shard_22.bin index c54a624f953d0e59b8d50615a83e3ec60a14ffab..da1636f398045e1c8b67eb09e7472d317140f548 100644 --- a/params_shard_22.bin +++ b/params_shard_22.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:12e47ead37ff482d777f049f40592b1f2f6d28fa5b2238d6a9360e5b96b37b7b +oid sha256:8b11e199aee4692ef58e9fee1bfc90fac260faf32e354eec0a7c51f2a5b4274c size 20185088 diff --git a/params_shard_23.bin b/params_shard_23.bin index 807d2347944e9e05b7345d2a72072dc3b4d64215..32a24a30c8e753920e54e4fbf5d985fe4bc44e93 100644 --- a/params_shard_23.bin +++ b/params_shard_23.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1783ba939b4780a0365a1d4b278219c2de0c29481c04bd3537aa1e17b63735d8 +oid sha256:50be5f38a4d455ac6158392f31b3c40d4cce81351fe7e4248e519b0592a2d438 size 30902272 diff --git a/params_shard_24.bin b/params_shard_24.bin index 6b11db1265674d818a10c4127faadd89a1b2e093..e54d076052fb219f7b24a0d9a51648e136b5ac2c 100644 --- a/params_shard_24.bin +++ b/params_shard_24.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:04a6127449b9c7e8507e3f479c2860199580b5312839f817df8272abc379e789 +oid sha256:e97b8595b4cc9691b13376ea4d0ce15830b2d40172d23fd457ab18c21a1b7dac size 20185088 diff --git a/params_shard_25.bin b/params_shard_25.bin index 36a6f040a83f8093cc39a52fd0672bca1fddb552..efa6e685c31aa7041ab2a76dc82a25fc15955bb0 100644 --- a/params_shard_25.bin +++ b/params_shard_25.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f27238deb725c1a3cd5499a0dc9749ca89923c0dc338653e13bb2964e1081f0c +oid sha256:1ffd33ebd959a299c851dfbe51dc407faf000780c376b8f21f73b8a52353f1cd size 30902272 diff --git a/params_shard_26.bin b/params_shard_26.bin index c64c1ab1787fe9fa2a897019c08569cee8c99a09..c9c0d66dabd89e6614ec43252a84ffd488178f6c 100644 --- a/params_shard_26.bin +++ b/params_shard_26.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:015c0dd453c31f66e2eb4dadacc803023554bd9d3d9dc0afa32cb210bf1ff1ef +oid sha256:b2cd782c32e0b33efbf69b7f2f4512837d3fad41a0b0d1415af7c90fc673ba7a size 20185088 diff --git a/params_shard_27.bin b/params_shard_27.bin index 7fe19e19197b5e12c85abb705542e5d1c3a45920..49d620ee0286201f5be579b58294bb055e295dcd 100644 --- a/params_shard_27.bin +++ b/params_shard_27.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b2d595350e4af88c3152621f262e46a588bd8d72380b0bf3714881cb1faf8549 +oid sha256:18ba431c68b9e8e93424947a1c9091dde73f75580e5a2c813584fee68156deef size 30902272 diff --git a/params_shard_28.bin b/params_shard_28.bin index 7279417be136ec80e3cbfe3ae24ea0c8b5a94604..449773c8bfa6c60f5e704111a29d87bcc543a3f2 100644 --- a/params_shard_28.bin +++ b/params_shard_28.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:01e32f71143c8a3de679e32ca62425ad2c55ca2b58270dd41124edc36a18a828 +oid sha256:a8d9f02ce047551002c5fe0e2a2baabc74ac9fece3704083fb64d9dbd839605d size 39502848 diff --git a/params_shard_29.bin b/params_shard_29.bin index 4460aeaccf569dc509e507dcb0b6d92789a2d047..39ee17f7ea474640dd47655afd32e4b18ec88775 100644 --- a/params_shard_29.bin +++ b/params_shard_29.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e87c7d95a461d0e245cd1a67694de5223dade5c46ad58fabde1d491a697b4973 +oid sha256:28533b0bdd59009f65f602492f27c1c75934297dc4a198fb77993aa7738acf20 size 20185088 diff --git a/params_shard_3.bin b/params_shard_3.bin index 210e9d24c3ae9635938702b1eeb858f4bcb66ba5..da86324f750ee4412360e9989d9434ab523394a2 100644 --- a/params_shard_3.bin +++ b/params_shard_3.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a2da35810d2c61ea848f7d593755dab3e2c82a139ef55c5bedbd390f356faabd +oid sha256:11ada41e574256e45c0be3c20cbe1e46ecc948c4f26310c9ea27941b7bacb434 size 31520768 diff --git a/params_shard_30.bin b/params_shard_30.bin index 467fed22b9e31d63f15969b1b37b7e599aa1ea4b..a03fce6f80e3cef7e4e1735e9a1c2891523e9fbb 100644 --- a/params_shard_30.bin +++ b/params_shard_30.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:db2a83cabc750539a713527e323abd35bc0adcb2910d0ce78173a51f7798afd2 +oid sha256:3c4744ef031633e844a076bf71d1d6b6bff507de34aac1d9ee09b4a2ad65640c size 33316992 diff --git a/params_shard_31.bin b/params_shard_31.bin index 559fccf18b30cbbd44d2176a315d30845768aa55..cc53a6baf3785253bfce2a735cbcb8b1c58c2e8b 100644 --- a/params_shard_31.bin +++ b/params_shard_31.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c57c20b916364d129f560879a3d082aa8ff99b17ae0cf6dd2cd1c6fc2b503514 +oid sha256:262d2ff5c92fbb420276bd3da76ab7650a7dff08afd712402690cab22ac196f5 size 20185088 diff --git a/params_shard_32.bin b/params_shard_32.bin index c46b2a85218c6656f3cbead56b81d0199909e247..d64e0fa1a94e19306c375a8fc3fc526c325efb5b 100644 --- a/params_shard_32.bin +++ b/params_shard_32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:72f07ca8b0ee96ea2eae4a585aa25256f356b095134a01a3ae1d6341e6bbb636 +oid sha256:a3848bda728101c29f68b72c6ce06d94e14fb1d18eca89c05ddf0b5b95774b64 size 33431552 diff --git a/params_shard_33.bin b/params_shard_33.bin index c26f90e41ccc8912d22fe91b04be9521e40825ea..7c04f34e00291c265f7366c4260dd58769e417b1 100644 --- a/params_shard_33.bin +++ b/params_shard_33.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ad1c8e60ad54ee57c91a6ded0d82902ac08db973ebfb4634f54353671e40b227 +oid sha256:b6f425e610af02153f4c31be5595b432351ee309de2695a3a8c019e32c8ac1bf size 20185088 diff --git a/params_shard_34.bin b/params_shard_34.bin index c7957aa124c214ea2e12be8239d8c667c45898d4..e4aa176870cba1fa80aca6704d01387bde738ac5 100644 --- a/params_shard_34.bin +++ b/params_shard_34.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:794a76b428e274e3786277f0fa00270e07490b1a4696022aa81cd7ab92b5a217 +oid sha256:aadb65c4310c997ebde31a1cb532f641999cc746920c86129d459c4ef04b3855 size 30902272 diff --git a/params_shard_35.bin b/params_shard_35.bin index 0982d9931b625499363fde7f2a8a53f20eed8763..cb7131df1a6326ea132b3e2fe0b245f823642b93 100644 --- a/params_shard_35.bin +++ b/params_shard_35.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:87dfef5e13bc89ed9a4ba85602036732e91722c4f65aebc6c2a39916f7d3c487 +oid sha256:780b102dbbb4a5ba238e06054c533fe60b01622424341b599397464313385bb1 size 20185088 diff --git a/params_shard_36.bin b/params_shard_36.bin index 9594276d1dc332d55f4f34ddb6790b33772d9103..03699799bdb8cb05e20bc8c18ce9e1a254fdbaa1 100644 --- a/params_shard_36.bin +++ b/params_shard_36.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:48956743ede24d442a2d532768b62eebdc01a7e96272ed3d0d74ae4ab85b61ad +oid sha256:1e312785a8974c2ff62978f1a32363c323041f2619ed6c2da840020d07f7d5be size 30902272 diff --git a/params_shard_37.bin b/params_shard_37.bin index d1662910d8c4fe0e27e281a0da27c8fe269d0359..b891ef65ade4ba758a9f4b7577726df3e474d354 100644 --- a/params_shard_37.bin +++ b/params_shard_37.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:04f7a29e40b78cf20b5e2acad6c831b8bd3a208779f8a4c0c54855a0cb7146af +oid sha256:9bd3d96ea617ce74ef1a100b9ac082c24ca2ee85db06a71e6b1adaabf311f879 size 20185088 diff --git a/params_shard_38.bin b/params_shard_38.bin index f783bdd292d23b4380faa0d29334476ca8fc616d..caf59d20cf5c0497e8037616217885ae199d3578 100644 --- a/params_shard_38.bin +++ b/params_shard_38.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4b00175382927b1312272fbfb1d7df8f6903629459d1f93dedb65314d97dc79d +oid sha256:eade88d5bc15a4129f71223387b362d28c360d032887cc4553e58c196aa6b2cb size 30902272 diff --git a/params_shard_39.bin b/params_shard_39.bin index 9f3a780c67805bc240e66fcd663c3cfc42be6a8a..f4e3181c960f8f3d59f3453750f0346c049c266f 100644 --- a/params_shard_39.bin +++ b/params_shard_39.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:879e29198c9a652bbf0d2d0f30adb96643e225246969e09bd4c21beb8825d8b3 +oid sha256:032a32db5ab531f392334e01e6c6d04204d4b3a419c09444b14bceab26396f5b size 20185088 diff --git a/params_shard_4.bin b/params_shard_4.bin index d7446324a7dcc7c2f0a7340ed7ee9d195d358755..3c72de8e1a18af442c88c93837dc33b218f86332 100644 --- a/params_shard_4.bin +++ b/params_shard_4.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ce5fb6ac83872abe400dea5a4486031e66c29bd6e1256d5b2fda2b379cef9b2a +oid sha256:3c298052f8beb1e2928ae94226f2ba8906092da99916170bafe85dc172f6c8a1 size 20185088 diff --git a/params_shard_40.bin b/params_shard_40.bin index a6da4aecf97925c5b80f9dc0003a579eda8f8102..b35050026241ea24fe88fa717bb995f7548616af 100644 --- a/params_shard_40.bin +++ b/params_shard_40.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b226e2531e7ab87361812e06246bea44603869d95b58b92e8f12cb40374a8292 +oid sha256:5d72b8139b61412d9a65a799de30bac64efddf84f8cb7f87295d77e0cd169dee size 30902272 diff --git a/params_shard_41.bin b/params_shard_41.bin index 640fec8c868f201067cd693e68b3c374be2b6c4b..8d3fd39a85c9ceed3ca91cfbed7915369f4a5b6a 100644 --- a/params_shard_41.bin +++ b/params_shard_41.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4d97cc6abbb295e2d7d6193eb5e49f2fcd9f53fe7aa929113df52cfacf27b026 +oid sha256:6be43090e3d7b36182fff92b58ac4d28f38500577a4ba3b592da559dc951b374 size 20185088 diff --git a/params_shard_42.bin b/params_shard_42.bin index 57cd5535e7092dfd5d7b1172548870b685823083..3838b35c9c07711ef31e4102d2b3708496e2b532 100644 --- a/params_shard_42.bin +++ b/params_shard_42.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:65dd615d75a86aff8d53b109161a11fd12f29886b267f6a123ce5410ce55f32a +oid sha256:195386caa8d8546cdbee823dbddedf9bafcab6aae213ad486d11bc899d9f06a7 size 30902272 diff --git a/params_shard_43.bin b/params_shard_43.bin index e876bab616ce96c641499bd0a5799df4846b5ae3..444e61da68a6fcf0d7bbd6d4f664a9ca18d922b4 100644 --- a/params_shard_43.bin +++ b/params_shard_43.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1341d5910ea7339b539476818686f66c977ede2b34693cce8ad5c8c2ad3628ca +oid sha256:3f3952864f25aaa0ff602a6b3e59c0f44f7db5e2c47eb5244ecf5d6e5ae2c168 size 20185088 diff --git a/params_shard_44.bin b/params_shard_44.bin index b42e3e0c3056f60ecc842e34df0db058f7380dd1..db97f975ae11b83fdb7350c19087030df1653787 100644 --- a/params_shard_44.bin +++ b/params_shard_44.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3184b7ce5a155d8126dccbb437c621d0f71b6e9695de807a91ff4a4c95a4a30f +oid sha256:283681df64503712b485768659657c188d5c239a5ce9cf545778d541ccfe145c size 30902272 diff --git a/params_shard_45.bin b/params_shard_45.bin index d37675816bfe8b5303c9268e5a22a715d50b35e4..110563df70cb7a05be918cd18161c761fe0d6f22 100644 --- a/params_shard_45.bin +++ b/params_shard_45.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:863acf25ff22bc4b550f798f4cfc506eca756b43574836368de66b3b47f95d41 +oid sha256:2401077ba29bca53a78501154e0e4e153473ac28429c76bf6e7645b59dab2b4e size 20185088 diff --git a/params_shard_46.bin b/params_shard_46.bin index e9ba1c8248ced343448f7fce0cfedf3d8eca82d6..9058b251d4a918962d5069df02f7bde79100950a 100644 --- a/params_shard_46.bin +++ b/params_shard_46.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3fc1d030dccf97f73de95a24064934352eb25eecb4875247bbe1c4e48ea8855c +oid sha256:7f8630bc7d1d9166be54e3d51015e16ddf1a710be3dc4b1c4acb53b6b03bc02e size 30902272 diff --git a/params_shard_47.bin b/params_shard_47.bin index 4e0b575a82befcdd04e1921bdaa3dbd0ed31272f..1cc4b5d796f717dc82b3e3f3e688236149cf8fe5 100644 --- a/params_shard_47.bin +++ b/params_shard_47.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c297b8c576d9d793a7739d800513ae1147105e4015554e8831582b35f4dcbad5 +oid sha256:371a059bc91a1b587f6c33eeb38f15b76b1b88d2dd2063164475f92a4c48273a size 20185088 diff --git a/params_shard_48.bin b/params_shard_48.bin index 2e69a63dd41641aa63066ba46e485de35fab91ee..39dc0730f78c4b314c1d365390fd1c28663c4390 100644 --- a/params_shard_48.bin +++ b/params_shard_48.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f4c4a947e812d92fff32cb51039bcf95e326497620ae26c6e6a4beaf458236e9 +oid sha256:d376abdff694588f8c8cdd832b772a2f6dc2ddb6aa86947cfc2d8c08b2606b8a size 30902272 diff --git a/params_shard_49.bin b/params_shard_49.bin index b494681565b3643be2f8fab3d25847a465597ada..5dac1142f8f415c60c001f8e1fa47265c37344ea 100644 --- a/params_shard_49.bin +++ b/params_shard_49.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:76038a354513e6181734a393fce81ab261c1d6e12eb1d19639fa56d9f42a68c4 +oid sha256:b9eb3a371ada23069368ebb908ef2b76baaca0aaa67ca9ba218caa558493cc87 size 20185088 diff --git a/params_shard_5.bin b/params_shard_5.bin index fbd576ca06a716792e571bd7a52ab2c49a886724..9583244510fb98abcda6bfd5111029027631f380 100644 --- a/params_shard_5.bin +++ b/params_shard_5.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2bec36b4ffc56f08cde90a20ea416ef61ccfdd11dfb96bfa2a7dbadd901900d9 +oid sha256:26aa07148775686c62038ad9395d7ec51b50139d2e497ffb2a08ce2b9771aea8 size 33431552 diff --git a/params_shard_50.bin b/params_shard_50.bin index 1c94fc51f9018111e43647678a87208ed78adb30..ba24fe464c2b8d7acdcb148711c5555bfb619f43 100644 --- a/params_shard_50.bin +++ b/params_shard_50.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0fd10613af6efe2908e970dc11aeeaf3841f1a31aca19b8d6c0f85253fdb8147 +oid sha256:04c09717c8e52ba7626c00e4e9f8db25a41a86075d948046df43b5b30c79451d size 32630784 diff --git a/params_shard_51.bin b/params_shard_51.bin index f0b6e91cca8d172aa5738b334bd52d402a885ec2..04e60b2ec0fcafdda05a89a3ea4b3fea5c0f52d5 100644 --- a/params_shard_51.bin +++ b/params_shard_51.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1529176c7c2809eb850c244600e35fef0f7a4c533606df32b78bb680e814b119 +oid sha256:d58a57922b6de90580e290e00c6ef3ebdaaa3889dd3b980355f7b9519a500b97 size 20185088 diff --git a/params_shard_52.bin b/params_shard_52.bin index a377e4d71bb999008aea2cacf1afd35b1a3d5426..17ae2690d21d1286a4e7d1b3fac7254c2e61572f 100644 --- a/params_shard_52.bin +++ b/params_shard_52.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1e14ab1e568e6237719a645630e6c3ed82830ac4ef4f3a5fd1458371e7f34d9f +oid sha256:02da546167083422790573bb7b199f2a4fd72ced025e524f079a568d54faf0ff size 33431552 diff --git a/params_shard_53.bin b/params_shard_53.bin index a6f485952c4ff84e443dac1da99bd6c2eadd59cf..b7a98d14ef14df37c686c5607d60fea49e84ea9c 100644 --- a/params_shard_53.bin +++ b/params_shard_53.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:28c460f4d14b087266f5ccec95069f120ba289240ba90389d51187accdb556f7 +oid sha256:246ea7931c1af8029364800595b810c33ee4cd4364648b902fffb07f4709a965 size 20185088 diff --git a/params_shard_54.bin b/params_shard_54.bin index 87c321585f9218eef347dffe6fb59c6d5ff2f5a7..3bfd4dac5d2c0e1add3651f923c1dd1becfd7999 100644 --- a/params_shard_54.bin +++ b/params_shard_54.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4a5b9c6a422d2abab3e0a4633910737b3c67a04b3dbce07515bc3ce00d94b2b7 +oid sha256:1ca5f6aa98ae34db0a8760b95dbb52050fe91da70dbb2781eaa435edc3333236 size 30902272 diff --git a/params_shard_55.bin b/params_shard_55.bin index f1ae8aff5aefbd8264075c3669fd3e3ae88d2ec9..0aa5f2edc8801c1f5ff46ce5486cba1a684112c3 100644 --- a/params_shard_55.bin +++ b/params_shard_55.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1d07c1f718532235e42eaca6a7eb9e1faed5c52b0155ce8511ae784362d87370 +oid sha256:c700c33f7a1582c4ba6a8f35acb15b44cafa668100efad9b196d521a7d13dacc size 20185088 diff --git a/params_shard_56.bin b/params_shard_56.bin index 92997fab017cf92c1b5606be9735f34fdfc1bfd5..bfe0f46a60de379c48f99a441de9954fc46a6474 100644 --- a/params_shard_56.bin +++ b/params_shard_56.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c088149ab835245d19d2d30cb60516383a2148d355e17a1e0809eeda3face5d0 +oid sha256:2aeced53372221ed3deed42ff7fc131a0cbd9558fd3c37d74cf852b5faa19143 size 30902272 diff --git a/params_shard_57.bin b/params_shard_57.bin index d3e4fb31f296d614a194331f67d5aaff65baa365..61e064b9451682008caf96b5808751e454c15dd6 100644 --- a/params_shard_57.bin +++ b/params_shard_57.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:37e8aba45320e5c6d1c1d1f5c3413036e609713a6008711fb235c39203eac2b1 +oid sha256:8042be0eb47af8c70338e5e246458a0be2dffb72e1b7f87705986f42c6dfa423 size 20185088 diff --git a/params_shard_58.bin b/params_shard_58.bin index e57e5e2af6147e743cfe55779f944efa371ebb24..123677d00f0e6e89023195c5753c3f31531cfd03 100644 --- a/params_shard_58.bin +++ b/params_shard_58.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4a6809be8290b1d5d5e7e846341565e99a11da4ae40c241885a0fe51eba3435b +oid sha256:567cd616598eed39862c18e3d6b796576cc4a9148fd82791bbc4eb3ddce0a6d8 size 30902272 diff --git a/params_shard_59.bin b/params_shard_59.bin index 4b5e1d5bd478159705033fe320e9fe9ce621cfe8..c38947e778e94a90eae799ce833ae29ae253bd51 100644 --- a/params_shard_59.bin +++ b/params_shard_59.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5d19d9b5f517e8700eaececc01e1d70d2476fd30d61a35b971b181c1a5a2b8b0 +oid sha256:7d2dbc682faa663cb6761c05d9ca7a2852d7c3ec4208748d8d70c89071bff9bd size 20185088 diff --git a/params_shard_6.bin b/params_shard_6.bin index 62ae5538a5d628b6e6f61d9f61423b3491ace618..1d5cf9ff9cf13291fd8d04d2bf1dddc8178ed4d3 100644 --- a/params_shard_6.bin +++ b/params_shard_6.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2342fd4d9104a3b522551c70e9d28be22e94f82478ec5301c70c00d85cb1e361 +oid sha256:449ba7704c064c79938cb27c407c6000ccd2441bb1149e7f8d5a744fccffee22 size 20185088 diff --git a/params_shard_60.bin b/params_shard_60.bin index 026d52e27e4566ce8e11af0a98a271a240831f8d..474f26625815d2d27ae3f373de116c3d4d2725ae 100644 --- a/params_shard_60.bin +++ b/params_shard_60.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f3c8db51f7fee529e9d30c1c772ffd5a346664d7fd49dab268fb014d4de502c0 +oid sha256:4d9fbcae26804be3588eb9797d6d64fa0fddb63f3aac34a04f8303c2b9e64f02 size 30902272 diff --git a/params_shard_61.bin b/params_shard_61.bin index 97770f7574a0b79cb04cf8ff8a17341f87f2115c..328a779bcc446159697804d57b38d55b777b9b27 100644 --- a/params_shard_61.bin +++ b/params_shard_61.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d3289802a1cc5c722c6b7df36d347d7dbd6ace9f3e469c10e1e75c4347a08a1a +oid sha256:d3433d45e53d634b6773c0635a6a0530a2c22d2a629f5286ca50a0ea43a5eeda size 20185088 diff --git a/params_shard_62.bin b/params_shard_62.bin index b722cbe22f577826d5c61651fb617f0e7dacb206..494da8d11f1a8b4bba3132222f5b96d7583593ce 100644 --- a/params_shard_62.bin +++ b/params_shard_62.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:58c7f585352241c4f2fee1e88dde71f3bb30af0f01c997e67e7b64f1a1b2cfd5 +oid sha256:460e9d933e3364d50999c4c52dcd83dc7217ac333130df4ba233cc09175712b5 size 30902272 diff --git a/params_shard_63.bin b/params_shard_63.bin index fc4ff5fad075b65da8c169ffdc114f546596936d..c5fb37b54b08e854fcd4f19ba659e20293334af7 100644 --- a/params_shard_63.bin +++ b/params_shard_63.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6da01a94514b2b11f687d30f8447320895ec5e0a1629ba1a323379fa69adb52f +oid sha256:3d79752e940bac46423a096c259bd23444fe6db87a35469838d134efa8ccd9e8 size 20185088 diff --git a/params_shard_64.bin b/params_shard_64.bin index 9c4eda700f25e2a2840776eb1e3ea58edadeb600..0d5996a52f3f9328dd7ab4bff611dd18ccea0de7 100644 --- a/params_shard_64.bin +++ b/params_shard_64.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:cb7b6c44c2b61105e614eeef72502f2c31b4d77b8ef56c8cb8c43edcec7861d3 +oid sha256:a6343d0b1c5e7dc59fbbff4074f005eba7e18b85ad616253fbc5e605af68131a size 30902272 diff --git a/params_shard_65.bin b/params_shard_65.bin index 5cd82ef303e5a0167512261c23f1e05fc9d21a7f..e9bbb5d4855d6b584b6578a5baab28b87790901b 100644 --- a/params_shard_65.bin +++ b/params_shard_65.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d3006b47483b850128e42e0585d4a22ffedff90e7bd5447481f8f6f59da0e27a -size 31968980 +oid sha256:8100388f01058fe0cd7fd4f101408a0f92424a19a1bb43960f9c17cae8b3aa55 +size 27834368 diff --git a/params_shard_66.bin b/params_shard_66.bin index a4f7e30108b5a78defa2b33e06583c8d4d83f17c..59811b282fc7444ac981a47824ad41bce4939b94 100644 --- a/params_shard_66.bin +++ b/params_shard_66.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:54edea24e976bb3eb73ede96ba66306db3b42a5b231e330272365245f6d6d901 -size 32634880 +oid sha256:95f92d7517fff429ac6464ed3de54b841aafd2e1b96485d8edbcd6f0f5c9892c +size 25192448 diff --git a/params_shard_67.bin b/params_shard_67.bin index 96e96df357b464fcfb9877d518cd098bf66efa01..d4459fd39922dec7c841f7b8c4fc14cf554e6364 100644 --- a/params_shard_67.bin +++ b/params_shard_67.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:706ee7a24bfca1cccf248f14daee4900a8675b5861bc4657c60295cfd970cb09 -size 33521664 +oid sha256:2907f5074bdae488baf0179fbd0d3a9703b8925d6aa26c19072cf39f30632a52 +size 25192448 diff --git a/params_shard_68.bin b/params_shard_68.bin index 6dc57a3bcfe6ca5825cab60f2d21ee9bbff519ab..3a09bfb8ad77f262966a65a055c39cb93804bd4c 100644 --- a/params_shard_68.bin +++ b/params_shard_68.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e48fd5b48fc504959cb75f346f4a666667520c7252cfa2c2628fdd068c726fff -size 33433600 +oid sha256:e52258f6054bfd1e5a63f3009d47471e6997e28b096182a3be103002625e7b5f +size 25192448 diff --git a/params_shard_69.bin b/params_shard_69.bin index 6153ed702ce66599a79226985df9f95a90d6283c..99688b0c0db89f44b28bff638c846f0db53e719c 100644 --- a/params_shard_69.bin +++ b/params_shard_69.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ed032360167eaba942c34436fa056750958646389d1282a51faafb84daf2aa32 -size 30887936 +oid sha256:dd9acd6c014a0e3e3a897009cb53798fc88b404b1716927528c983fb1c209506 +size 25192448 diff --git a/params_shard_7.bin b/params_shard_7.bin index fec254d57f9d528f5a3577446d908fe3ef5060b0..0b623ff90d66711bbbd55ad6e29288c026be5261 100644 --- a/params_shard_7.bin +++ b/params_shard_7.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:427ec72aca90f68b955af8213e882315550ad9fd8c88d23e62818a0f7af837cf +oid sha256:e4d61a60f24694607887e7a9dc49068402282da49b6601621f8f4b1a3d87d469 size 30902272 diff --git a/params_shard_70.bin b/params_shard_70.bin index 767361d2f6a1b7f12a08f7756959f613a98ee82b..8feb427823459689c69aa930cab2a23292327a4a 100644 --- a/params_shard_70.bin +++ b/params_shard_70.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2709ca772f2a56d391a90be8dc84ab2c0a72d944ad28f606ebcf43d877817dfb -size 4265984 +oid sha256:b98c509c9dd6d2d651ce561a1b40b9ed54da611a1dee3b301939ce644f8ab5f4 +size 25192448 diff --git a/params_shard_71.bin b/params_shard_71.bin new file mode 100644 index 0000000000000000000000000000000000000000..5d23a29ba623e1bd9cf07a33ec4fc4187cf240f7 --- /dev/null +++ b/params_shard_71.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a393ae05270bacd4e1bfc159c658dc0c2d120c62b74814ce0dcb4e1dc6adbb25 +size 25192448 diff --git a/params_shard_72.bin b/params_shard_72.bin new file mode 100644 index 0000000000000000000000000000000000000000..72f9664df124f76c21c700903e633730d1f752a2 --- /dev/null +++ b/params_shard_72.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:961c95cae2217b3f91ae66dd5bdd217a3786570e08e92526a0ed1e31a9d0a26d +size 25192448 diff --git a/params_shard_73.bin b/params_shard_73.bin new file mode 100644 index 0000000000000000000000000000000000000000..98c06b0966c3bdb1b9fdb1479b91754bae3ca839 --- /dev/null +++ b/params_shard_73.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efa58db84fbc3b6cac71f8d43b11ebc7ea23514a9759fb642c4424107ebe52ef +size 25192448 diff --git a/params_shard_74.bin b/params_shard_74.bin new file mode 100644 index 0000000000000000000000000000000000000000..d5f3a209d8fea02e4e3b71d5d4a8753800f04b4c --- /dev/null +++ b/params_shard_74.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe8b445092c0315182349dcad54cf7152c561d2238ae565e740576c766da99b0 +size 25192448 diff --git a/params_shard_75.bin b/params_shard_75.bin new file mode 100644 index 0000000000000000000000000000000000000000..4351b9bab50d16bc35d02d66f1a957cc48a9b0bb --- /dev/null +++ b/params_shard_75.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44419c11afdfe4a06d2fafba5568f054aa4d01d580291b9d5978c36951fa14b7 +size 25192448 diff --git a/params_shard_76.bin b/params_shard_76.bin new file mode 100644 index 0000000000000000000000000000000000000000..cd692928a5e2b04d81dae5f4ce877fe46b39bf12 --- /dev/null +++ b/params_shard_76.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fe50070e333c5844a40ba3a6961a2164c2a15fa53e554848d4f0c7d1819c819 +size 25192448 diff --git a/params_shard_77.bin b/params_shard_77.bin new file mode 100644 index 0000000000000000000000000000000000000000..15df2cd29ab48348b42c74fa11c4ae4e546938a7 --- /dev/null +++ b/params_shard_77.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c8111bddd12144adfa3a8dee1a21d2c9134f5f94179aefac6d3d6d5a08eb623 +size 25192448 diff --git a/params_shard_78.bin b/params_shard_78.bin new file mode 100644 index 0000000000000000000000000000000000000000..767cc22ad290c9e6ef407055a0957afed85a139f --- /dev/null +++ b/params_shard_78.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef3a20952446e3802dcd8392cf071e9d5427d1287901517af125a7bcb6d68722 +size 25192448 diff --git a/params_shard_79.bin b/params_shard_79.bin new file mode 100644 index 0000000000000000000000000000000000000000..c499622903ea5bca9e07a1cd29211976deac6361 --- /dev/null +++ b/params_shard_79.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c10de3efd24198d9211e04c07fa0589647f24ec9c2b23eb79c05b1c03913e77c +size 25192448 diff --git a/params_shard_8.bin b/params_shard_8.bin index cd98e5b8f02c1907bcfb9c13f111204eb44a87a2..30006fea889a9f05e8b995c2659341613ba3c70b 100644 --- a/params_shard_8.bin +++ b/params_shard_8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:dcd946de61c6f8e7523b1832be58ffc86f10fcd49b4d541649aeb89459f94985 +oid sha256:98535f2c2c32d20dbc0abe49145d86c73a421d380bbf346d82465f89c3e8fdfd size 20185088 diff --git a/params_shard_80.bin b/params_shard_80.bin new file mode 100644 index 0000000000000000000000000000000000000000..27702db0ef554ab6dc3b1cfd50382fdf89a86644 --- /dev/null +++ b/params_shard_80.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25823a9063b8218a1d3d11d18be96984a5f798e8efc1ac26b97083dd369c308a +size 25192448 diff --git a/params_shard_81.bin b/params_shard_81.bin new file mode 100644 index 0000000000000000000000000000000000000000..efe41e5de5cadef2fd1f04e22ecb210a5ab0caac --- /dev/null +++ b/params_shard_81.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f917a43ac21c3f03b0dfb3c3ca797dc6e95da24d37659e88d823aa4cd948ed5e +size 25192448 diff --git a/params_shard_82.bin b/params_shard_82.bin new file mode 100644 index 0000000000000000000000000000000000000000..4d0108c8f2d520525574269cee045e3f3c9e1de8 --- /dev/null +++ b/params_shard_82.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dd89aa87467417fba324dbc57251fb8af684b86da3dd5ff95fab8eedf31325f +size 25192448 diff --git a/params_shard_83.bin b/params_shard_83.bin new file mode 100644 index 0000000000000000000000000000000000000000..b61a1190637f49ce4ffeedbe07da73ba69efb144 --- /dev/null +++ b/params_shard_83.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e7957183ff6d4b77bba3b349158d2d0d3c5c0059140f0e6dc3836ab2b28fd1d +size 25192448 diff --git a/params_shard_84.bin b/params_shard_84.bin new file mode 100644 index 0000000000000000000000000000000000000000..0991ac96fad5c0df60e3f6664835fe3664ff927a --- /dev/null +++ b/params_shard_84.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f29ef3fcc9ba8c66b7d85750451a1066cad22142876e0b0ad1dad6d6d626734 +size 25192448 diff --git a/params_shard_85.bin b/params_shard_85.bin new file mode 100644 index 0000000000000000000000000000000000000000..cb8e8e71915ea867c4d1b5c75ca4c598dbc627ae --- /dev/null +++ b/params_shard_85.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3cb80fac56fa63595d204122751bc048a218f552b3525ee8666e3d5a1a5bb61 +size 25192448 diff --git a/params_shard_86.bin b/params_shard_86.bin new file mode 100644 index 0000000000000000000000000000000000000000..955e937d196645c5763bcf8104e57f28284125d5 --- /dev/null +++ b/params_shard_86.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15fe6e0782e6c7fcc2608a620bd532df2c01948210a0ae29a78fd26e08cc8848 +size 25192448 diff --git a/params_shard_87.bin b/params_shard_87.bin new file mode 100644 index 0000000000000000000000000000000000000000..7919c7b9829e1cecca0a8e5eb0e7e524e13c0cc8 --- /dev/null +++ b/params_shard_87.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3a6b054e2b0fa6fac22c84b14f9e8e20095648e7fdf00f9659ade781f7e53c2 +size 25192448 diff --git a/params_shard_88.bin b/params_shard_88.bin new file mode 100644 index 0000000000000000000000000000000000000000..4af783852328cc823db7ae61b6d2b62d2c94e322 --- /dev/null +++ b/params_shard_88.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47d578479f438d9a57c130ecabbe1bae0bd7cdf78a9b875fd105cdfdca5322f5 +size 25192448 diff --git a/params_shard_89.bin b/params_shard_89.bin new file mode 100644 index 0000000000000000000000000000000000000000..310e73a9a9d1729442af80e3938637b8c5284c7f --- /dev/null +++ b/params_shard_89.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df585ce2224a5d505f44d51a5fadead60e4c3b6297bffdfd738b41c457250915 +size 26767360 diff --git a/params_shard_9.bin b/params_shard_9.bin index cc744de269f2008da34eb5948537e0aed42aa0d1..d71851de7a53e40335040dd9b38407a8852b4d0a 100644 --- a/params_shard_9.bin +++ b/params_shard_9.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:639855512474625e121398ae0dae03a02a3774412bd74e78d42bbd1287c3efee +oid sha256:1a41f1f59cabdd24e0334e1a7984a22d44a48c7304f5569d6f7994cbd8e1bb7f size 30902272