diff --git "a/ndarray-cache.json" "b/ndarray-cache.json" --- "a/ndarray-cache.json" +++ "b/ndarray-cache.json" @@ -1,8 +1,8 @@ { "metadata": { - "ParamSize": 869, - "ParamBytes": 2334114368.0, - "BitsPerParam": 4.612736555784706 + "ParamSize": 724, + "ParamBytes": 2769074176.0, + "BitsPerParam": 5.4723152611665915 }, "records": [ { @@ -22,7 +22,7 @@ "byteOffset": 0 } ], - "md5sum": "03f42a0e4b7b45fb1af495013d415f70" + "md5sum": "d462bf6681cfdf3a155a33ec34995397" }, { "dataPath": "params_shard_1.bin", @@ -41,7 +41,7 @@ "byteOffset": 0 } ], - "md5sum": "c26c0bfa7471129355a632bdaceee085" + "md5sum": "44d1346cb8ecbad2a0225b6f8e6b6601" }, { "dataPath": "params_shard_2.bin", @@ -113,7 +113,7 @@ "byteOffset": 23463936 } ], - "md5sum": "c76c21adf2577acc8d5081f81635683e" + "md5sum": "d58b2bfe1a2018f50a2295a25b598203" }, { "dataPath": "params_shard_3.bin", @@ -132,7 +132,7 @@ "byteOffset": 0 } ], - "md5sum": "41e36be4010532f225910ab2da957df4" + "md5sum": "23f15d529480da9a0c42195b3916270f" }, { "dataPath": "params_shard_4.bin", @@ -215,7 +215,7 @@ "byteOffset": 33232896 } ], - "md5sum": "11fe3e24529e5d875b431ad76adbe6c6" + "md5sum": "f1e852dd01f75d353a308f918d7e042b" }, { "dataPath": "params_shard_5.bin", @@ -277,7 +277,7 @@ "byteOffset": 21233664 } ], - "md5sum": "db5de768c5c55cec34ee218899f883da" + "md5sum": "d1e46423910f8ff09fa2dea997c9df8a" }, { "dataPath": "params_shard_6.bin", @@ -296,7 +296,7 @@ "byteOffset": 0 } ], - "md5sum": "a7cf0e4fcf6869e0b96ea26b6952735a" + "md5sum": "019f500de4760aacd3ee30f87cf92f36" }, { "dataPath": "params_shard_7.bin", @@ -369,7 +369,7 @@ "byteOffset": 22026240 } ], - "md5sum": "f50a0ec8d5b4bc9f25ff5debd51c1210" + "md5sum": "0487a6f5169a8ec8731946ac438aca6f" }, { "dataPath": "params_shard_8.bin", @@ -388,7 +388,7 @@ "byteOffset": 0 } ], - "md5sum": "b3731b47d71ec2a2e1a621ce45bce622" + "md5sum": "4bd7aa0e240a5d3fe5cc4f04f0019851" }, { "dataPath": "params_shard_9.bin", @@ -471,7 +471,7 @@ "byteOffset": 33232896 } ], - "md5sum": "f4b6989d71a06160012b50345da2ab97" + "md5sum": "2d48bf11c0cfb3f138ef4e44e0bc8205" }, { "dataPath": "params_shard_10.bin", @@ -533,7 +533,7 @@ "byteOffset": 21233664 } ], - "md5sum": "c7b2fb1b7113e0d9e7ad802025d5a6fc" + "md5sum": "18c37a099b97287fa32ef12c06226d92" }, { "dataPath": "params_shard_11.bin", @@ -552,7 +552,7 @@ "byteOffset": 0 } ], - "md5sum": "dcc01e341ca10fefd9aac289c3960b97" + "md5sum": "6f715301d4fdbd2ed658ba3a86320f80" }, { "dataPath": "params_shard_12.bin", @@ -625,7 +625,7 @@ "byteOffset": 22026240 } ], - "md5sum": "8cb7f4afa1a3f347d0c443319a527b6a" + "md5sum": "f010e04f362de8344df9efd68dff17c5" }, { "dataPath": "params_shard_13.bin", @@ -644,7 +644,7 @@ "byteOffset": 0 } ], - "md5sum": "d4fe2733606e5a5c79372261fc28000f" + "md5sum": "f280ebae4a4dc4feaac07b649772118c" }, { "dataPath": "params_shard_14.bin", @@ -727,7 +727,7 @@ "byteOffset": 33232896 } ], - "md5sum": "5d76b6998116de6c8c8d5425a914df0f" + "md5sum": "d8dc46dad50b01ad80d76e32e5c4e872" }, { "dataPath": "params_shard_15.bin", @@ -789,7 +789,7 @@ "byteOffset": 21233664 } ], - "md5sum": "ef8fe2ffb42f9b91176fa4a9f11bb9de" + "md5sum": "bc99209d84c0f0887b53d173d95639dc" }, { "dataPath": "params_shard_16.bin", @@ -808,7 +808,7 @@ "byteOffset": 0 } ], - "md5sum": "9557dd078ae2cb230face8006995fcf7" + "md5sum": "f988ea3fd6c4ef0446d41f6489f8137d" }, { "dataPath": "params_shard_17.bin", @@ -881,7 +881,7 @@ "byteOffset": 22026240 } ], - "md5sum": "3baec0d24d4200875fc06af28c3fb0b8" + "md5sum": "a90dc6c7a0cd0ab22ac28efa49a37437" }, { "dataPath": "params_shard_18.bin", @@ -900,7 +900,7 @@ "byteOffset": 0 } ], - "md5sum": "65fbda0ea3fad96582fbcac92f4400fc" + "md5sum": "0367200ee6d724634eee64500b76e9f4" }, { "dataPath": "params_shard_19.bin", @@ -983,7 +983,7 @@ "byteOffset": 33232896 } ], - "md5sum": "75a0298eea85723412219cc9cb8016a4" + "md5sum": "e4e0d58bac3892d7466dc7a57d15b527" }, { "dataPath": "params_shard_20.bin", @@ -1045,7 +1045,7 @@ "byteOffset": 21233664 } ], - "md5sum": "c6b63b21d6d195d1b184b030c167b1c9" + "md5sum": "137ce81a2aef53ce819f2ddcba2662a9" }, { "dataPath": "params_shard_21.bin", @@ -1064,7 +1064,7 @@ "byteOffset": 0 } ], - "md5sum": "324d6fab6d373401073546ed03d39211" + "md5sum": "57f52a6294ba07ccfd40862302abfeb0" }, { "dataPath": "params_shard_22.bin", @@ -1137,7 +1137,7 @@ "byteOffset": 22026240 } ], - "md5sum": "8e042a2e177639cb2ff674f3a7266210" + "md5sum": "fb637e3862f096624612a89e5d550586" }, { "dataPath": "params_shard_23.bin", @@ -1156,7 +1156,7 @@ "byteOffset": 0 } ], - "md5sum": "e92a94d89f861c2c5e9d08f206b7bc1c" + "md5sum": "c4a2128471bb8163d1155d4428a3e096" }, { "dataPath": "params_shard_24.bin", @@ -1239,7 +1239,7 @@ "byteOffset": 33232896 } ], - "md5sum": "af4e357109ce0dd01c3ea75acb8aaa1a" + "md5sum": "8f46c0f65098b2f7150326e2032cad8e" }, { "dataPath": "params_shard_25.bin", @@ -1301,7 +1301,7 @@ "byteOffset": 21233664 } ], - "md5sum": "303caa4cee9e70c8bd1066464c2ea849" + "md5sum": "75acd30a2b79d831f7db532a8999a1f3" }, { "dataPath": "params_shard_26.bin", @@ -1320,7 +1320,7 @@ "byteOffset": 0 } ], - "md5sum": "70b2cf47e9e55432dd9088afd8e9a83e" + "md5sum": "8d06da6215b2c8aa873f4c228389f389" }, { "dataPath": "params_shard_27.bin", @@ -1393,7 +1393,7 @@ "byteOffset": 22026240 } ], - "md5sum": "c94a2d330f9cb37c8a61cf90deb0b45f" + "md5sum": "4f7f06d0c1fc498bcd4128e6a62b01ba" }, { "dataPath": "params_shard_28.bin", @@ -1412,7 +1412,7 @@ "byteOffset": 0 } ], - "md5sum": "b76a9a27c46ac52bddcd744b605564a9" + "md5sum": "dd4a9fc77672f3d4c5b29e3167fd4881" }, { "dataPath": "params_shard_29.bin", @@ -1495,7 +1495,7 @@ "byteOffset": 33232896 } ], - "md5sum": "fc3908ef1ff4fab5a81adf786477d8b4" + "md5sum": "86a3a85df8b0d7a1237d036a46ad6a8e" }, { "dataPath": "params_shard_30.bin", @@ -1557,7 +1557,7 @@ "byteOffset": 21233664 } ], - "md5sum": "3df7172b8ec78578295ca75338a0c32e" + "md5sum": "3f10adaed93c9b7fb821bc8b1f35659e" }, { "dataPath": "params_shard_31.bin", @@ -1576,7 +1576,7 @@ "byteOffset": 0 } ], - "md5sum": "bd5f5975f4b7f21f2554644da9da6f5a" + "md5sum": "6ddec1d838994a89efa5c5534a00f63a" }, { "dataPath": "params_shard_32.bin", @@ -1649,7 +1649,7 @@ "byteOffset": 22026240 } ], - "md5sum": "fb63daef7fca12dea591efd21b9d9c14" + "md5sum": "196b53103b396b64b908064f9984b4b7" }, { "dataPath": "params_shard_33.bin", @@ -1668,7 +1668,7 @@ "byteOffset": 0 } ], - "md5sum": "6511803dfb93c3e3ce95b0dd94e1270d" + "md5sum": "f913ba05408e86b44bc31f5a275e9cb1" }, { "dataPath": "params_shard_34.bin", @@ -1751,7 +1751,7 @@ "byteOffset": 33232896 } ], - "md5sum": "acd04c251a6a0b8a09fa648724078f9f" + "md5sum": "0ed9f2a3baa6009111345e9fd08c0fe8" }, { "dataPath": "params_shard_35.bin", @@ -1770,7 +1770,7 @@ "byteOffset": 0 } ], - "md5sum": "424943277254877ab0a7690d3839c6af" + "md5sum": "ba96aa7c1453daa5716bf285fc9e0332" }, { "dataPath": "params_shard_36.bin", @@ -1853,7 +1853,7 @@ "byteOffset": 27396096 } ], - "md5sum": "6e3c5ead604216089bb2bd02a4329a5a" + "md5sum": "956c42c6309a4a9e50ac3273a1dfe096" }, { "dataPath": "params_shard_37.bin", @@ -1872,7 +1872,7 @@ "byteOffset": 0 } ], - "md5sum": "044a1b344b2891ed7f019e9757264f23" + "md5sum": "70ec8bdbd4f6edee811b13e8382e6d31" }, { "dataPath": "params_shard_38.bin", @@ -1945,7 +1945,7 @@ "byteOffset": 22026240 } ], - "md5sum": "203e211d7b41621ac79a6cf68e143d10" + "md5sum": "30a7c74e2dabfffe2c79084684693ff9" }, { "dataPath": "params_shard_39.bin", @@ -1964,7 +1964,7 @@ "byteOffset": 0 } ], - "md5sum": "e85ef9ff37755c08ce31c1aa203216a6" + "md5sum": "19808d9fb46a8dbe89f96ef7fcbde15b" }, { "dataPath": "params_shard_40.bin", @@ -2047,7 +2047,7 @@ "byteOffset": 33232896 } ], - "md5sum": "315bdc92c799dd2d5e4f3d5f56606ab0" + "md5sum": "e9ce9615c09f57448e2ce79382a96f14" }, { "dataPath": "params_shard_41.bin", @@ -2109,7 +2109,7 @@ "byteOffset": 21233664 } ], - "md5sum": "54074992d6adab3a53bb5113104dc2a2" + "md5sum": "fc45420316ea727605be5d7e0ed8e9da" }, { "dataPath": "params_shard_42.bin", @@ -2128,7 +2128,7 @@ "byteOffset": 0 } ], - "md5sum": "583cf91ed8d73e29c53be3ba8e6b0157" + "md5sum": "7b52744731cd22ca6bf33ee27302e1e3" }, { "dataPath": "params_shard_43.bin", @@ -2201,7 +2201,7 @@ "byteOffset": 22026240 } ], - "md5sum": "6ec2356dc75920d46ae39ff75a61e327" + "md5sum": "7016666073af181d421de47db3cd2df4" }, { "dataPath": "params_shard_44.bin", @@ -2220,7 +2220,7 @@ "byteOffset": 0 } ], - "md5sum": "0c8fac4fdb901171c0687163c39bfb24" + "md5sum": "da8ffafadefa5bee6e92402a262c1591" }, { "dataPath": "params_shard_45.bin", @@ -2303,7 +2303,7 @@ "byteOffset": 33232896 } ], - "md5sum": "f04da33a046700d1fd0c52d1a748b20f" + "md5sum": "579ea893625576de7ec6c925c8e472a5" }, { "dataPath": "params_shard_46.bin", @@ -2365,7 +2365,7 @@ "byteOffset": 21233664 } ], - "md5sum": "94bce31b25ff3751bd949ee2651ff3b0" + "md5sum": "3e3a519e78b6d214c6935bf47d9fd6da" }, { "dataPath": "params_shard_47.bin", @@ -2384,7 +2384,7 @@ "byteOffset": 0 } ], - "md5sum": "deb5606d247d964e84946eb2acf96f17" + "md5sum": "01263e0f52d5530fd5dcce9d6e558faf" }, { "dataPath": "params_shard_48.bin", @@ -2457,7 +2457,7 @@ "byteOffset": 22026240 } ], - "md5sum": "147b605c605618800546ef40d9f7dfd9" + "md5sum": "df492083954171dd0f29c8347415ad4c" }, { "dataPath": "params_shard_49.bin", @@ -2476,7 +2476,7 @@ "byteOffset": 0 } ], - "md5sum": "c9e508bb9637f442a61701f39953c947" + "md5sum": "26e9da272c07b9e3164ee39204001b1a" }, { "dataPath": "params_shard_50.bin", @@ -2559,7 +2559,7 @@ "byteOffset": 33232896 } ], - "md5sum": "54e8325797a3869da3e17f7137347f37" + "md5sum": "515c4b3a001119843a14b1ebb186f53e" }, { "dataPath": "params_shard_51.bin", @@ -2621,7 +2621,7 @@ "byteOffset": 21233664 } ], - "md5sum": "d2df7b8d4d0a89dd25e2c890d09ba7ac" + "md5sum": "e852ade5c26bd91ab0fa82467a3777c6" }, { "dataPath": "params_shard_52.bin", @@ -2640,7 +2640,7 @@ "byteOffset": 0 } ], - "md5sum": "8f64903fe513470efaea44cb44882554" + "md5sum": "0adac2bada661247eab94698103f825d" }, { "dataPath": "params_shard_53.bin", @@ -2713,7 +2713,7 @@ "byteOffset": 22026240 } ], - "md5sum": "3aa4555b974bea81381743734646ac6f" + "md5sum": "4a35f0ddaaab6863a2c5a3e4a407a249" }, { "dataPath": "params_shard_54.bin", @@ -2732,7 +2732,7 @@ "byteOffset": 0 } ], - "md5sum": "9bdaa9ffa45dbeba3f15230433248a45" + "md5sum": "9c9045251d6bd64178aee3423ba02d53" }, { "dataPath": "params_shard_55.bin", @@ -2815,7 +2815,7 @@ "byteOffset": 33232896 } ], - "md5sum": "a4838335ebbe75771cf31aee80e9386b" + "md5sum": "678735984da6a7c65a985ea9bcdd9e1d" }, { "dataPath": "params_shard_56.bin", @@ -2877,7 +2877,7 @@ "byteOffset": 21233664 } ], - "md5sum": "54597a723cf21d0eef770522979d21ba" + "md5sum": "6faf93f32ebae44e2316776e943b73d5" }, { "dataPath": "params_shard_57.bin", @@ -2896,7 +2896,7 @@ "byteOffset": 0 } ], - "md5sum": "55c07771f9d95822295047a776e4e716" + "md5sum": "7c906b3f2d0a23b4b404f384ada6c863" }, { "dataPath": "params_shard_58.bin", @@ -2969,7 +2969,7 @@ "byteOffset": 22026240 } ], - "md5sum": "e292be869f50f3f22711ede0efca8e99" + "md5sum": "d5a7ef52b511ca5c6607c93718976580" }, { "dataPath": "params_shard_59.bin", @@ -2988,7 +2988,7 @@ "byteOffset": 0 } ], - "md5sum": "fc5c9bf4993163454cac074473ec84ff" + "md5sum": "7835aa22e5fc3ab43904a7ba317dd05e" }, { "dataPath": "params_shard_60.bin", @@ -3071,7 +3071,7 @@ "byteOffset": 33232896 } ], - "md5sum": "35b09aad431916ab9986914db9feaa15" + "md5sum": "97c2f05f64c9839ba60e57e830c919e6" }, { "dataPath": "params_shard_61.bin", @@ -3155,7 +3155,7 @@ "byteOffset": 26542080 } ], - "md5sum": "d612bf0a65838fe9cd7c5338b0ab2d1a" + "md5sum": "8f2cc14e740a795d3945a92bca16366a" }, { "dataPath": "params_shard_62.bin", @@ -3174,7 +3174,7 @@ "byteOffset": 0 } ], - "md5sum": "a334b0a59263051527b3959507c2059f" + "md5sum": "56f2f22839c6b77063e3a90f30122137" }, { "dataPath": "params_shard_63.bin", @@ -3247,7 +3247,7 @@ "byteOffset": 22026240 } ], - "md5sum": "ff92efa38feb0013fbeeeb24a6beb6a2" + "md5sum": "f69a2221a90921e660620770b711fd17" }, { "dataPath": "params_shard_64.bin", @@ -3266,7 +3266,7 @@ "byteOffset": 0 } ], - "md5sum": "1030ee4948f7cc79712705800b13e010" + "md5sum": "c6e8789cf22bfb7a983b1834e983dd6e" }, { "dataPath": "params_shard_65.bin", @@ -3349,7 +3349,7 @@ "byteOffset": 33232896 } ], - "md5sum": "1d2e26f38ce827dce9e614d53fbae96b" + "md5sum": "0273ecef5ee3e36de92d20e60a6091a0" }, { "dataPath": "params_shard_66.bin", @@ -3411,7 +3411,7 @@ "byteOffset": 21233664 } ], - "md5sum": "5d4f870aa25b56a966e21e557b6a5689" + "md5sum": "5026939da604c97430a95d2026bb282c" }, { "dataPath": "params_shard_67.bin", @@ -3430,7 +3430,7 @@ "byteOffset": 0 } ], - "md5sum": "b8512fae8f93fbd9f4f7f73337311990" + "md5sum": "6c825a7113de38b7e100f9e7f45fc976" }, { "dataPath": "params_shard_68.bin", @@ -3503,7 +3503,7 @@ "byteOffset": 22026240 } ], - "md5sum": "dca262e67f5875824b6cb19b77b87f2b" + "md5sum": "e8545eb30fe53e7a9809bcbc52e5edc7" }, { "dataPath": "params_shard_69.bin", @@ -3522,7 +3522,7 @@ "byteOffset": 0 } ], - "md5sum": "95e02febe339e87fd2dc66e8720d5724" + "md5sum": "1bb546cc943cea45bd5a83dca1919c16" }, { "dataPath": "params_shard_70.bin", @@ -3605,7 +3605,7 @@ "byteOffset": 33232896 } ], - "md5sum": "9ffc11f2725ba1a6a50397edb5970b7b" + "md5sum": "3c5add49f666f50d75e351c3758271f1" }, { "dataPath": "params_shard_71.bin", @@ -3667,7 +3667,7 @@ "byteOffset": 21233664 } ], - "md5sum": "b82024bf6121748baaa0b2e15f45292a" + "md5sum": "b9817824fd05540c9968991b4973535f" }, { "dataPath": "params_shard_72.bin", @@ -3686,7 +3686,7 @@ "byteOffset": 0 } ], - "md5sum": "74351377410f94f98f638d90086a3ba3" + "md5sum": "2cbf2b759939a9c467cdcd7a35ba6ce7" }, { "dataPath": "params_shard_73.bin", @@ -3759,7 +3759,7 @@ "byteOffset": 22026240 } ], - "md5sum": "8fcac7f6ef447f7857682429ee194f8c" + "md5sum": "3f972e64e6d289c178af439b37093a27" }, { "dataPath": "params_shard_74.bin", @@ -3778,7 +3778,7 @@ "byteOffset": 0 } ], - "md5sum": "92d2cc1b281e6bb28f465b49ff9b208c" + "md5sum": "a2f722107d2de12aa1644399cd04810a" }, { "dataPath": "params_shard_75.bin", @@ -3861,7 +3861,7 @@ "byteOffset": 33232896 } ], - "md5sum": "5db69c637c72f53238fa9c6f55f2d4ef" + "md5sum": "c6eaaee1e69bfad8b25eaac488987947" }, { "dataPath": "params_shard_76.bin", @@ -3923,7 +3923,7 @@ "byteOffset": 21233664 } ], - "md5sum": "18aac3937281d4613c4bebe4fef0e9f5" + "md5sum": "83155bcc2223493f6ca1afce08a7e233" }, { "dataPath": "params_shard_77.bin", @@ -3942,7 +3942,7 @@ "byteOffset": 0 } ], - "md5sum": "e6cfafe2fc17539ef7a158a9c123d35c" + "md5sum": "aa3e3bbca10469c352e931114e4352e5" }, { "dataPath": "params_shard_78.bin", @@ -4015,7 +4015,7 @@ "byteOffset": 22026240 } ], - "md5sum": "d095dac880afc3e18c3ce261f3fa747e" + "md5sum": "11036296e1ab0f3fc2aad53eea717d1d" }, { "dataPath": "params_shard_79.bin", @@ -4034,7 +4034,7 @@ "byteOffset": 0 } ], - "md5sum": "ced88ec5fc5b74c9a3131e2cbc474bc9" + "md5sum": "698469bf0d9056a98e7b4b95100337ce" }, { "dataPath": "params_shard_80.bin", @@ -4117,12 +4117,12 @@ "byteOffset": 33232896 } ], - "md5sum": "62a16d6f9c5485e7c09d371f33dd08d3" + "md5sum": "72d7706eb3e77d679c1a21db987444f9" }, { "dataPath": "params_shard_81.bin", "format": "raw-shard", - "nbytes": 32262720, + "nbytes": 32036864, "records": [ { "name": "model.h.9.mixer.out_proj.q_weight", @@ -4204,26 +4204,15 @@ "byteOffset": 21243904 }, { - "name": "vision_embed_tokens.img_processor.vision_model.embeddings.position_embedding.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.embeddings.position_embedding.weight", "shape": [ 577, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 295424, - "byteOffset": 22448128 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.embeddings.position_embedding.q_scale", - "shape": [ - 577, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 36928, - "byteOffset": 22743552 + "nbytes": 1181696, + "byteOffset": 22448128 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.layer_norm1.bias", @@ -4233,7 +4222,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 22780480 + "byteOffset": 23629824 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.layer_norm1.weight", @@ -4243,7 +4232,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 22782528 + "byteOffset": 23631872 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.layer_norm2.bias", @@ -4253,7 +4242,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 22784576 + "byteOffset": 23633920 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.layer_norm2.weight", @@ -4263,7 +4252,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 22786624 + "byteOffset": 23635968 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.mlp.fc1.bias", @@ -4273,29 +4262,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 22788672 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.mlp.fc1.q_weight", - "shape": [ - 4096, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 22796864 + "byteOffset": 23638016 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.mlp.fc1.weight", "shape": [ 4096, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 24894016 + "nbytes": 8388608, + "byteOffset": 23646208 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.mlp.fc2.bias", @@ -4305,29 +4283,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 25156160 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.mlp.fc2.q_weight", - "shape": [ - 1024, - 512 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 25158208 - }, + "byteOffset": 32034816 + } + ], + "md5sum": "06eb2520ad6b2dfb6527b035312460c8" + }, + { + "dataPath": "params_shard_82.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.mlp.fc2.weight", "shape": [ 1024, - 128 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 27255360 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.k_proj.bias", @@ -4337,29 +4312,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 27517504 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 27519552 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.k_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 28043840 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.out_proj.bias", @@ -4369,29 +4333,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 28109376 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 28111424 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.out_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 28635712 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.q_proj.bias", @@ -4401,29 +4354,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 28701248 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 28703296 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.q_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 29227584 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.v_proj.bias", @@ -4433,29 +4375,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 29293120 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 29295168 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.v_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 29819456 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.layer_norm1.bias", @@ -4465,7 +4396,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 29884992 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.layer_norm1.weight", @@ -4475,7 +4406,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 29887040 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.layer_norm2.bias", @@ -4485,7 +4416,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 29889088 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.layer_norm2.weight", @@ -4495,7 +4426,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 29891136 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.mlp.fc1.bias", @@ -4505,29 +4436,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 29893184 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.mlp.fc1.q_weight", - "shape": [ - 4096, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 29901376 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.mlp.fc1.weight", "shape": [ 4096, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 31998528 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.mlp.fc2.bias", @@ -4537,37 +4457,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 32260672 + "byteOffset": 25190400 } ], - "md5sum": "f31749651cdc2e1f7cb48008e11e163a" + "md5sum": "12ccc3786467895471d31bb5b1d2610c" }, { - "dataPath": "params_shard_82.bin", + "dataPath": "params_shard_83.bin", "format": "raw-shard", - "nbytes": 33161216, + "nbytes": 25192448, "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.mlp.fc2.q_weight", - "shape": [ - 1024, - 512 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 0 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.mlp.fc2.weight", "shape": [ 1024, - 128 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 2097152 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.k_proj.bias", @@ -4577,29 +4486,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 2359296 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 2361344 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.k_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 2885632 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.out_proj.bias", @@ -4609,29 +4507,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 2951168 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 2953216 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.out_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 3477504 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.q_proj.bias", @@ -4641,29 +4528,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 3543040 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 3545088 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.q_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 4069376 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.v_proj.bias", @@ -4673,29 +4549,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 4134912 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 4136960 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.v_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 4661248 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.layer_norm1.bias", @@ -4705,7 +4570,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 4726784 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.layer_norm1.weight", @@ -4715,7 +4580,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 4728832 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.layer_norm2.bias", @@ -4725,7 +4590,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 4730880 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.layer_norm2.weight", @@ -4735,7 +4600,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 4732928 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.mlp.fc1.bias", @@ -4745,29 +4610,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 4734976 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.mlp.fc1.q_weight", - "shape": [ - 4096, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 4743168 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.mlp.fc1.weight", "shape": [ 4096, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 6840320 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.mlp.fc2.bias", @@ -4777,29 +4631,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 7102464 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.mlp.fc2.q_weight", - "shape": [ - 1024, - 512 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 7104512 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "dcc2adf61aa07fe189bb15874110e845" + }, + { + "dataPath": "params_shard_84.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.mlp.fc2.weight", "shape": [ 1024, - 128 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 9201664 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.k_proj.bias", @@ -4809,29 +4660,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 9463808 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.k_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.k_proj.weight", "shape": [ 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 9465856 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.k_proj.q_scale", - "shape": [ - 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 9990144 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.out_proj.bias", @@ -4841,29 +4681,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 10055680 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 10057728 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.out_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 10582016 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.q_proj.bias", @@ -4873,29 +4702,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 10647552 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 10649600 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.q_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 11173888 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.v_proj.bias", @@ -4905,29 +4723,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 11239424 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 11241472 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.v_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 11765760 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.layer_norm1.bias", @@ -4937,7 +4744,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 11831296 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.layer_norm1.weight", @@ -4947,7 +4754,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 11833344 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.layer_norm2.bias", @@ -4957,7 +4764,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 11835392 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.layer_norm2.weight", @@ -4967,7 +4774,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 11837440 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.mlp.fc1.bias", @@ -4977,29 +4784,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 11839488 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.mlp.fc1.q_weight", - "shape": [ - 4096, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 11847680 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.mlp.fc1.weight", "shape": [ 4096, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 13944832 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.mlp.fc2.bias", @@ -5009,29 +4805,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 14206976 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.mlp.fc2.q_weight", - "shape": [ - 1024, - 512 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 14209024 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "9f8d49d8894a05f4179ba707925e9d59" + }, + { + "dataPath": "params_shard_85.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.mlp.fc2.weight", "shape": [ 1024, - 128 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 16306176 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.k_proj.bias", @@ -5041,29 +4834,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 16568320 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 16570368 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.k_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 17094656 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.out_proj.bias", @@ -5073,29 +4855,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 17160192 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.out_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.out_proj.weight", "shape": [ 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 17162240 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.out_proj.q_scale", - "shape": [ - 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 17686528 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.q_proj.bias", @@ -5105,29 +4876,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 17752064 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 17754112 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.q_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 18278400 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.v_proj.bias", @@ -5137,29 +4897,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 18343936 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 18345984 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.v_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 18870272 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.layer_norm1.bias", @@ -5169,7 +4918,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 18935808 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.layer_norm1.weight", @@ -5179,7 +4928,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 18937856 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.layer_norm2.bias", @@ -5189,7 +4938,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 18939904 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.layer_norm2.weight", @@ -5199,7 +4948,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 18941952 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.mlp.fc1.bias", @@ -5209,29 +4958,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 18944000 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.mlp.fc1.q_weight", - "shape": [ - 4096, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 18952192 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.mlp.fc1.weight", "shape": [ 4096, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 21049344 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.mlp.fc2.bias", @@ -5241,29 +4979,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 21311488 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.mlp.fc2.q_weight", - "shape": [ - 1024, - 512 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 21313536 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "19b6f5d2cfc839108f9156b8b521d3ce" + }, + { + "dataPath": "params_shard_86.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.mlp.fc2.weight", "shape": [ 1024, - 128 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 23410688 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.k_proj.bias", @@ -5273,29 +5008,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 23672832 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 23674880 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.k_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 24199168 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.out_proj.bias", @@ -5305,29 +5029,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 24264704 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 24266752 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.out_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 24791040 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.q_proj.bias", @@ -5337,29 +5050,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 24856576 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.q_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.q_proj.weight", "shape": [ 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 24858624 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.q_proj.q_scale", - "shape": [ - 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 25382912 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.v_proj.bias", @@ -5369,29 +5071,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 25448448 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 25450496 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.v_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 25974784 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.layer_norm1.bias", @@ -5401,7 +5092,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 26040320 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.layer_norm1.weight", @@ -5411,7 +5102,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 26042368 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.layer_norm2.bias", @@ -5421,7 +5112,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 26044416 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.layer_norm2.weight", @@ -5431,7 +5122,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 26046464 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.mlp.fc1.bias", @@ -5441,29 +5132,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 26048512 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.mlp.fc1.q_weight", - "shape": [ - 4096, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 26056704 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.mlp.fc1.weight", "shape": [ 4096, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 28153856 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.mlp.fc2.bias", @@ -5473,29 +5153,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 28416000 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.mlp.fc2.q_weight", - "shape": [ - 1024, - 512 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 28418048 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "3e6322c0673873144d67964c709fa3be" + }, + { + "dataPath": "params_shard_87.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.mlp.fc2.weight", "shape": [ 1024, - 128 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 30515200 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.k_proj.bias", @@ -5505,29 +5182,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 30777344 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 30779392 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.k_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 31303680 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.out_proj.bias", @@ -5537,29 +5203,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 31369216 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 31371264 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.out_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 31895552 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.q_proj.bias", @@ -5569,29 +5224,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 31961088 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 31963136 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.q_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 32487424 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.v_proj.bias", @@ -5601,29 +5245,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 32552960 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.v_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.v_proj.weight", "shape": [ 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 32555008 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.v_proj.q_scale", - "shape": [ - 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 33079296 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.layer_norm1.bias", @@ -5633,7 +5266,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 33144832 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.layer_norm1.weight", @@ -5643,7 +5276,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 33146880 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.layer_norm2.bias", @@ -5653,7 +5286,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 33148928 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.layer_norm2.weight", @@ -5663,7 +5296,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 33150976 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.mlp.fc1.bias", @@ -5673,37 +5306,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 33153024 - } - ], - "md5sum": "f08b634e46a63d50279fc8be715cd065" - }, - { - "dataPath": "params_shard_83.bin", - "format": "raw-shard", - "nbytes": 33140736, - "records": [ - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.mlp.fc1.q_weight", - "shape": [ - 4096, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 0 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.mlp.fc1.weight", "shape": [ 4096, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 2097152 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.mlp.fc2.bias", @@ -5713,29 +5327,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 2359296 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.mlp.fc2.q_weight", - "shape": [ - 1024, - 512 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 2361344 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "f04370015a40ae2073f5d89ad86f1c42" + }, + { + "dataPath": "params_shard_88.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.mlp.fc2.weight", "shape": [ 1024, - 128 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 4458496 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.k_proj.bias", @@ -5745,29 +5356,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 4720640 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 4722688 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.k_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 5246976 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.out_proj.bias", @@ -5777,29 +5377,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 5312512 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 5314560 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.out_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 5838848 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.q_proj.bias", @@ -5809,29 +5398,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 5904384 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 5906432 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.q_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 6430720 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.v_proj.bias", @@ -5841,29 +5419,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 6496256 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 6498304 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.v_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 7022592 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.layer_norm1.bias", @@ -5873,7 +5440,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 7088128 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.layer_norm1.weight", @@ -5883,7 +5450,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 7090176 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.layer_norm2.bias", @@ -5893,7 +5460,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 7092224 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.layer_norm2.weight", @@ -5903,7 +5470,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 7094272 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.mlp.fc1.bias", @@ -5913,29 +5480,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 7096320 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.mlp.fc1.q_weight", - "shape": [ - 4096, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 7104512 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.mlp.fc1.weight", "shape": [ 4096, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 9201664 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.mlp.fc2.bias", @@ -5945,29 +5501,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 9463808 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.mlp.fc2.q_weight", - "shape": [ - 1024, - 512 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 9465856 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "e2c99d455ee851ede30d282481166453" + }, + { + "dataPath": "params_shard_89.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.mlp.fc2.weight", "shape": [ 1024, - 128 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 11563008 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.k_proj.bias", @@ -5977,29 +5530,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 11825152 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 11827200 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.k_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 12351488 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.out_proj.bias", @@ -6009,29 +5551,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 12417024 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 12419072 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.out_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 12943360 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.q_proj.bias", @@ -6041,29 +5572,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 13008896 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 13010944 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.q_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 13535232 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.v_proj.bias", @@ -6073,29 +5593,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 13600768 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 13602816 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.v_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 14127104 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.layer_norm1.bias", @@ -6105,7 +5614,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 14192640 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.layer_norm1.weight", @@ -6115,7 +5624,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 14194688 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.layer_norm2.bias", @@ -6125,7 +5634,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 14196736 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.layer_norm2.weight", @@ -6135,7 +5644,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 14198784 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.mlp.fc1.bias", @@ -6145,29 +5654,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 14200832 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.mlp.fc1.q_weight", - "shape": [ - 4096, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 14209024 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.mlp.fc1.weight", "shape": [ 4096, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 16306176 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.mlp.fc2.bias", @@ -6177,29 +5675,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 16568320 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.mlp.fc2.q_weight", - "shape": [ - 1024, - 512 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 16570368 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "11c75f74757caccc61b9f6c3f39a9737" + }, + { + "dataPath": "params_shard_90.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.mlp.fc2.weight", "shape": [ 1024, - 128 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 18667520 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.k_proj.bias", @@ -6209,29 +5704,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 18929664 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 18931712 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.k_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 19456000 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.out_proj.bias", @@ -6241,29 +5725,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 19521536 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.out_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.out_proj.weight", "shape": [ 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 19523584 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.out_proj.q_scale", - "shape": [ - 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 20047872 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.q_proj.bias", @@ -6273,29 +5746,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 20113408 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.q_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.q_proj.weight", "shape": [ 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 20115456 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.q_proj.q_scale", - "shape": [ - 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 20639744 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.v_proj.bias", @@ -6305,29 +5767,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 20705280 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 20707328 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.v_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 21231616 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.layer_norm1.bias", @@ -6337,7 +5788,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 21297152 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.layer_norm1.weight", @@ -6347,7 +5798,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 21299200 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.layer_norm2.bias", @@ -6357,7 +5808,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 21301248 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.layer_norm2.weight", @@ -6367,7 +5818,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 21303296 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.mlp.fc1.bias", @@ -6377,29 +5828,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 21305344 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.mlp.fc1.q_weight", - "shape": [ - 4096, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 21313536 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.mlp.fc1.weight", "shape": [ 4096, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 23410688 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.mlp.fc2.bias", @@ -6409,29 +5849,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 23672832 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.mlp.fc2.q_weight", - "shape": [ - 1024, - 512 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 23674880 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "a7f57fd25793b85aa6027a514efc39fb" + }, + { + "dataPath": "params_shard_91.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.mlp.fc2.weight", "shape": [ 1024, - 128 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 25772032 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.k_proj.bias", @@ -6441,29 +5878,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 26034176 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 26036224 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.k_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 26560512 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.out_proj.bias", @@ -6473,29 +5899,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 26626048 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.out_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.out_proj.weight", "shape": [ 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 26628096 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.out_proj.q_scale", - "shape": [ - 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 27152384 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.q_proj.bias", @@ -6505,29 +5920,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 27217920 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 27219968 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.q_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 27744256 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.v_proj.bias", @@ -6537,29 +5941,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 27809792 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 27811840 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.v_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 28336128 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.layer_norm1.bias", @@ -6569,7 +5962,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 28401664 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.layer_norm1.weight", @@ -6579,7 +5972,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 28403712 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.layer_norm2.bias", @@ -6589,7 +5982,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 28405760 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.layer_norm2.weight", @@ -6599,7 +5992,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 28407808 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.mlp.fc1.bias", @@ -6609,29 +6002,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 28409856 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.mlp.fc1.q_weight", - "shape": [ - 4096, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 28418048 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.mlp.fc1.weight", "shape": [ 4096, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 30515200 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.mlp.fc2.bias", @@ -6641,29 +6023,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 30777344 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.mlp.fc2.q_weight", - "shape": [ - 1024, - 512 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 30779392 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "e13228942bc433e638fe3903001715f3" + }, + { + "dataPath": "params_shard_92.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.mlp.fc2.weight", "shape": [ 1024, - 128 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 32876544 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.k_proj.bias", @@ -6673,37 +6052,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 33138688 - } - ], - "md5sum": "a0e8309f607c57253603f2ffd504cce4" - }, - { - "dataPath": "params_shard_84.bin", - "format": "raw-shard", - "nbytes": 33161216, - "records": [ - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 0 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.k_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 524288 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.out_proj.bias", @@ -6713,29 +6073,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 589824 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 591872 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.out_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 1116160 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.q_proj.bias", @@ -6745,29 +6094,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 1181696 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 1183744 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.q_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 1708032 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.v_proj.bias", @@ -6777,29 +6115,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 1773568 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 1775616 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.v_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 2299904 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.layer_norm1.bias", @@ -6809,7 +6136,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 2365440 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.layer_norm1.weight", @@ -6819,7 +6146,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 2367488 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.layer_norm2.bias", @@ -6829,7 +6156,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 2369536 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.layer_norm2.weight", @@ -6839,7 +6166,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 2371584 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.mlp.fc1.bias", @@ -6849,29 +6176,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 2373632 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.mlp.fc1.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.mlp.fc1.weight", "shape": [ 4096, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 2381824 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.mlp.fc1.q_scale", - "shape": [ - 4096, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 4478976 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.mlp.fc2.bias", @@ -6881,29 +6197,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 4741120 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.mlp.fc2.q_weight", - "shape": [ - 1024, - 512 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 4743168 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "eab0a6fc1a1e3beac991a0be01fdefe8" + }, + { + "dataPath": "params_shard_93.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.mlp.fc2.weight", "shape": [ 1024, - 128 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 6840320 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.k_proj.bias", @@ -6913,29 +6226,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 7102464 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.k_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.k_proj.weight", "shape": [ 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 7104512 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.k_proj.q_scale", - "shape": [ - 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 7628800 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.out_proj.bias", @@ -6945,29 +6247,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 7694336 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 7696384 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.out_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 8220672 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.q_proj.bias", @@ -6977,29 +6268,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 8286208 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.q_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.q_proj.weight", "shape": [ 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 8288256 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.q_proj.q_scale", - "shape": [ - 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 8812544 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.v_proj.bias", @@ -7009,29 +6289,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 8878080 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 8880128 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.v_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 9404416 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.layer_norm1.bias", @@ -7041,7 +6310,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 9469952 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.layer_norm1.weight", @@ -7051,7 +6320,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 9472000 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.layer_norm2.bias", @@ -7061,7 +6330,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 9474048 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.layer_norm2.weight", @@ -7071,7 +6340,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 9476096 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.mlp.fc1.bias", @@ -7081,29 +6350,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 9478144 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.mlp.fc1.q_weight", - "shape": [ - 4096, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 9486336 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.mlp.fc1.weight", "shape": [ 4096, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 11583488 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.mlp.fc2.bias", @@ -7113,29 +6371,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 11845632 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.mlp.fc2.q_weight", - "shape": [ - 1024, - 512 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 11847680 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "afcfd0263f305fcc63e7b86393753bf7" + }, + { + "dataPath": "params_shard_94.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.mlp.fc2.weight", "shape": [ 1024, - 128 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 13944832 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.k_proj.bias", @@ -7145,29 +6400,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 14206976 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 14209024 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.k_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 14733312 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.out_proj.bias", @@ -7177,29 +6421,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 14798848 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 14800896 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.out_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 15325184 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.q_proj.bias", @@ -7209,29 +6442,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 15390720 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 15392768 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.q_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 15917056 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.v_proj.bias", @@ -7241,29 +6463,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 15982592 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 15984640 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.v_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 16508928 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.layer_norm1.bias", @@ -7273,7 +6484,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 16574464 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.layer_norm1.weight", @@ -7283,7 +6494,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 16576512 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.layer_norm2.bias", @@ -7293,145 +6504,109 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 16578560 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.layer_norm2.weight", - "shape": [ - 1024 - ], - "dtype": "float16", - "format": "f32-to-bf16", - "nbytes": 2048, - "byteOffset": 16580608 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.mlp.fc1.bias", - "shape": [ - 4096 - ], - "dtype": "float16", - "format": "f32-to-bf16", - "nbytes": 8192, - "byteOffset": 16582656 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.mlp.fc1.q_weight", - "shape": [ - 4096, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 16590848 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.mlp.fc1.q_scale", - "shape": [ - 4096, - 32 - ], - "dtype": "float16", - "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 18688000 + "byteOffset": 16789504 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.mlp.fc2.bias", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.layer_norm2.weight", "shape": [ 1024 ], "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 18950144 + "byteOffset": 16791552 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.mlp.fc2.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.mlp.fc1.bias", "shape": [ - 1024, - 512 + 4096 ], - "dtype": "uint32", + "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 18952192 + "nbytes": 8192, + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.mlp.fc1.weight", "shape": [ - 1024, - 128 + 4096, + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 21049344 + "nbytes": 8388608, + "byteOffset": 16801792 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.k_proj.bias", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.mlp.fc2.bias", "shape": [ 1024 ], "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 21311488 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "460a8bc76edf812f85886ec9f950f395" + }, + { + "dataPath": "params_shard_95.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.k_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.mlp.fc2.weight", "shape": [ 1024, - 128 + 4096 ], - "dtype": "uint32", + "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 21313536 + "nbytes": 8388608, + "byteOffset": 0 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.k_proj.bias", "shape": [ - 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 21837824 + "nbytes": 2048, + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.out_proj.bias", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.k_proj.weight", "shape": [ + 1024, 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 2048, - "byteOffset": 21903360 + "nbytes": 2097152, + "byteOffset": 8390656 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.out_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.out_proj.bias", "shape": [ - 1024, - 128 + 1024 ], - "dtype": "uint32", + "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 21905408 + "nbytes": 2048, + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.out_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 22429696 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.q_proj.bias", @@ -7441,29 +6616,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 22495232 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 22497280 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.q_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 23021568 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.v_proj.bias", @@ -7473,29 +6637,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 23087104 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 23089152 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.v_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 23613440 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.layer_norm1.bias", @@ -7505,7 +6658,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 23678976 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.layer_norm1.weight", @@ -7515,7 +6668,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 23681024 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.layer_norm2.bias", @@ -7525,7 +6678,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 23683072 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.layer_norm2.weight", @@ -7535,7 +6688,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 23685120 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.mlp.fc1.bias", @@ -7545,29 +6698,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 23687168 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.mlp.fc1.q_weight", - "shape": [ - 4096, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 23695360 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.mlp.fc1.weight", "shape": [ 4096, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 25792512 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.mlp.fc2.bias", @@ -7577,29 +6719,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 26054656 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.mlp.fc2.q_weight", - "shape": [ - 1024, - 512 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 26056704 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "bcac984764bba0a4eb9891d2043e1d89" + }, + { + "dataPath": "params_shard_96.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.mlp.fc2.weight", "shape": [ 1024, - 128 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 28153856 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.k_proj.bias", @@ -7609,29 +6748,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 28416000 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 28418048 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.k_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 28942336 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.out_proj.bias", @@ -7641,29 +6769,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 29007872 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 29009920 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.out_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 29534208 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.q_proj.bias", @@ -7673,29 +6790,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 29599744 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 29601792 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.q_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 30126080 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.v_proj.bias", @@ -7705,29 +6811,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 30191616 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 30193664 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.v_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 30717952 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.layer_norm1.bias", @@ -7737,7 +6832,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 30783488 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.layer_norm1.weight", @@ -7747,7 +6842,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 30785536 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.layer_norm2.bias", @@ -7757,7 +6852,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 30787584 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.layer_norm2.weight", @@ -7767,7 +6862,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 30789632 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.mlp.fc1.bias", @@ -7777,29 +6872,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 30791680 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.mlp.fc1.q_weight", - "shape": [ - 4096, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 30799872 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.mlp.fc1.weight", "shape": [ 4096, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 32897024 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.mlp.fc2.bias", @@ -7809,37 +6893,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 33159168 + "byteOffset": 25190400 } ], - "md5sum": "10ad505e9ab90b00640b5382d9bb5582" + "md5sum": "3197e582d745d84c2ab4347a1f2d4e2d" }, { - "dataPath": "params_shard_85.bin", + "dataPath": "params_shard_97.bin", "format": "raw-shard", - "nbytes": 33161216, + "nbytes": 25192448, "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.mlp.fc2.q_weight", - "shape": [ - 1024, - 512 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 0 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.mlp.fc2.weight", "shape": [ 1024, - 128 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 2097152 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.k_proj.bias", @@ -7849,29 +6922,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 2359296 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 2361344 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.k_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 2885632 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.out_proj.bias", @@ -7881,29 +6943,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 2951168 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 2953216 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.out_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 3477504 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.q_proj.bias", @@ -7913,29 +6964,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 3543040 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 3545088 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.q_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 4069376 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.v_proj.bias", @@ -7945,29 +6985,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 4134912 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 4136960 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.v_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 4661248 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.layer_norm1.bias", @@ -7977,7 +7006,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 4726784 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.layer_norm1.weight", @@ -7987,7 +7016,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 4728832 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.layer_norm2.bias", @@ -7997,7 +7026,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 4730880 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.layer_norm2.weight", @@ -8007,7 +7036,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 4732928 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.mlp.fc1.bias", @@ -8017,29 +7046,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 4734976 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.mlp.fc1.q_weight", - "shape": [ - 4096, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 4743168 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.mlp.fc1.weight", "shape": [ 4096, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 6840320 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.mlp.fc2.bias", @@ -8049,29 +7067,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 7102464 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.mlp.fc2.q_weight", - "shape": [ - 1024, - 512 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 7104512 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "e6d67ae9f4dab5ea49fac79bceac7a86" + }, + { + "dataPath": "params_shard_98.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.mlp.fc2.weight", "shape": [ 1024, - 128 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 9201664 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.k_proj.bias", @@ -8081,29 +7096,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 9463808 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 9465856 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.k_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 9990144 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.out_proj.bias", @@ -8113,29 +7117,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 10055680 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 10057728 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.out_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 10582016 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.q_proj.bias", @@ -8144,30 +7137,19 @@ ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 2048, - "byteOffset": 10647552 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 10649600 + "nbytes": 2048, + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.q_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 11173888 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.v_proj.bias", @@ -8177,29 +7159,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 11239424 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 11241472 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.v_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 11765760 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.layer_norm1.bias", @@ -8209,7 +7180,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 11831296 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.layer_norm1.weight", @@ -8219,7 +7190,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 11833344 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.layer_norm2.bias", @@ -8229,7 +7200,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 11835392 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.layer_norm2.weight", @@ -8239,7 +7210,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 11837440 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.mlp.fc1.bias", @@ -8249,29 +7220,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 11839488 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.mlp.fc1.q_weight", - "shape": [ - 4096, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 11847680 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.mlp.fc1.weight", "shape": [ 4096, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 13944832 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.mlp.fc2.bias", @@ -8281,29 +7241,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 14206976 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.mlp.fc2.q_weight", - "shape": [ - 1024, - 512 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 14209024 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "1a74510bf14d6fc06b53f09ee6a22fdd" + }, + { + "dataPath": "params_shard_99.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.mlp.fc2.weight", "shape": [ 1024, - 128 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 16306176 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.k_proj.bias", @@ -8313,29 +7270,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 16568320 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 16570368 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.k_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 17094656 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.out_proj.bias", @@ -8345,29 +7291,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 17160192 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 17162240 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.out_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 17686528 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.q_proj.bias", @@ -8377,29 +7312,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 17752064 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 17754112 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.q_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 18278400 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.v_proj.bias", @@ -8409,29 +7333,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 18343936 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 18345984 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.v_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 18870272 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.layer_norm1.bias", @@ -8441,7 +7354,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 18935808 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.layer_norm1.weight", @@ -8451,7 +7364,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 18937856 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.layer_norm2.bias", @@ -8461,7 +7374,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 18939904 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.layer_norm2.weight", @@ -8471,7 +7384,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 18941952 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.mlp.fc1.bias", @@ -8481,29 +7394,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 18944000 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.mlp.fc1.q_weight", - "shape": [ - 4096, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 18952192 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.mlp.fc1.weight", "shape": [ 4096, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 21049344 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.mlp.fc2.bias", @@ -8513,29 +7415,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 21311488 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.mlp.fc2.q_weight", - "shape": [ - 1024, - 512 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 21313536 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "75a9ee23e852e5562e2176a5ece04f24" + }, + { + "dataPath": "params_shard_100.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.mlp.fc2.weight", "shape": [ 1024, - 128 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 23410688 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.k_proj.bias", @@ -8545,29 +7444,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 23672832 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 23674880 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.k_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 24199168 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.out_proj.bias", @@ -8577,29 +7465,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 24264704 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 24266752 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.out_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 24791040 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.q_proj.bias", @@ -8609,29 +7486,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 24856576 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 24858624 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.q_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 25382912 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.v_proj.bias", @@ -8641,29 +7507,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 25448448 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 25450496 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.v_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 25974784 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.layer_norm1.bias", @@ -8673,7 +7528,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 26040320 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.layer_norm1.weight", @@ -8683,7 +7538,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 26042368 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.layer_norm2.bias", @@ -8693,7 +7548,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 26044416 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.layer_norm2.weight", @@ -8703,7 +7558,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 26046464 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.mlp.fc1.bias", @@ -8713,29 +7568,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 26048512 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.mlp.fc1.q_weight", - "shape": [ - 4096, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 26056704 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.mlp.fc1.weight", "shape": [ 4096, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 28153856 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.mlp.fc2.bias", @@ -8745,29 +7589,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 28416000 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.mlp.fc2.q_weight", - "shape": [ - 1024, - 512 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 28418048 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "da3f4d64dad38aa57a47fd6fbca1a334" + }, + { + "dataPath": "params_shard_101.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.mlp.fc2.weight", "shape": [ 1024, - 128 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 30515200 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.k_proj.bias", @@ -8777,29 +7618,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 30777344 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 30779392 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.k_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 31303680 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.out_proj.bias", @@ -8809,29 +7639,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 31369216 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 31371264 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.out_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 31895552 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.q_proj.bias", @@ -8841,29 +7660,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 31961088 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 31963136 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.q_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 32487424 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.v_proj.bias", @@ -8873,29 +7681,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 32552960 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 32555008 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.v_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 33079296 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.layer_norm1.bias", @@ -8905,7 +7702,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 33144832 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.layer_norm1.weight", @@ -8915,7 +7712,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 33146880 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.layer_norm2.bias", @@ -8925,7 +7722,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 33148928 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.layer_norm2.weight", @@ -8935,7 +7732,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 33150976 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.mlp.fc1.bias", @@ -8945,37 +7742,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 33153024 - } - ], - "md5sum": "16f33cc460696f29368f48352e15c0cb" - }, - { - "dataPath": "params_shard_86.bin", - "format": "raw-shard", - "nbytes": 28416000, - "records": [ - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.mlp.fc1.q_weight", - "shape": [ - 4096, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 0 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.mlp.fc1.weight", "shape": [ 4096, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 2097152 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.mlp.fc2.bias", @@ -8985,29 +7763,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 2359296 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.mlp.fc2.q_weight", - "shape": [ - 1024, - 512 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 2361344 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "ca1eb7481171d37cc9fab4b3432d81d1" + }, + { + "dataPath": "params_shard_102.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.mlp.fc2.weight", "shape": [ 1024, - 128 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 4458496 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.k_proj.bias", @@ -9017,29 +7792,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 4720640 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.k_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.k_proj.weight", "shape": [ 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 4722688 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.k_proj.q_scale", - "shape": [ - 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 5246976 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.out_proj.bias", @@ -9049,29 +7813,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 5312512 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 5314560 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.out_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 5838848 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.q_proj.bias", @@ -9081,29 +7834,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 5904384 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 5906432 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.q_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 6430720 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.v_proj.bias", @@ -9113,29 +7855,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 6496256 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 6498304 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.v_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 7022592 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.layer_norm1.bias", @@ -9145,7 +7876,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 7088128 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.layer_norm1.weight", @@ -9155,7 +7886,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 7090176 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.layer_norm2.bias", @@ -9165,7 +7896,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 7092224 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.layer_norm2.weight", @@ -9175,7 +7906,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 7094272 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.mlp.fc1.bias", @@ -9185,29 +7916,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 7096320 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.mlp.fc1.q_weight", - "shape": [ - 4096, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 7104512 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.mlp.fc1.weight", "shape": [ 4096, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 9201664 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.mlp.fc2.bias", @@ -9217,29 +7937,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 9463808 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.mlp.fc2.q_weight", - "shape": [ - 1024, - 512 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 9465856 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "03be4317a6855a15625866d5dde56763" + }, + { + "dataPath": "params_shard_103.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.mlp.fc2.weight", "shape": [ 1024, - 128 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 11563008 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.k_proj.bias", @@ -9249,29 +7966,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 11825152 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 11827200 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.k_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 12351488 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.out_proj.bias", @@ -9281,29 +7987,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 12417024 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 12419072 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.out_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 12943360 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.q_proj.bias", @@ -9313,29 +8008,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 13008896 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 13010944 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.q_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 13535232 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.v_proj.bias", @@ -9345,29 +8029,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 13600768 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 13602816 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.v_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 14127104 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.layer_norm1.bias", @@ -9377,7 +8050,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 14192640 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.layer_norm1.weight", @@ -9387,7 +8060,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 14194688 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.layer_norm2.bias", @@ -9397,7 +8070,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 14196736 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.layer_norm2.weight", @@ -9407,7 +8080,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 14198784 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.mlp.fc1.bias", @@ -9417,29 +8090,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 14200832 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.mlp.fc1.q_weight", - "shape": [ - 4096, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 14209024 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.mlp.fc1.weight", "shape": [ 4096, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 16306176 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.mlp.fc2.bias", @@ -9449,29 +8111,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 16568320 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.mlp.fc2.q_weight", - "shape": [ - 1024, - 512 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 16570368 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "7464cccd529310def6e3920c637ad62c" + }, + { + "dataPath": "params_shard_104.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.mlp.fc2.weight", "shape": [ 1024, - 128 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 18667520 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.k_proj.bias", @@ -9481,29 +8140,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 18929664 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 18931712 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.k_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 19456000 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.out_proj.bias", @@ -9513,29 +8161,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 19521536 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 19523584 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.out_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 20047872 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.q_proj.bias", @@ -9545,29 +8182,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 20113408 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 20115456 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.q_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 20639744 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.v_proj.bias", @@ -9577,29 +8203,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 20705280 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 20707328 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.v_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 21231616 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.layer_norm1.bias", @@ -9609,7 +8224,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 21297152 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.layer_norm1.weight", @@ -9619,7 +8234,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 21299200 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.layer_norm2.bias", @@ -9629,7 +8244,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 21301248 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.layer_norm2.weight", @@ -9639,7 +8254,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 21303296 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.mlp.fc1.bias", @@ -9649,29 +8264,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 21305344 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.mlp.fc1.q_weight", - "shape": [ - 4096, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 21313536 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.mlp.fc1.weight", "shape": [ 4096, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 23410688 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.mlp.fc2.bias", @@ -9681,29 +8285,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 23672832 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.mlp.fc2.q_weight", - "shape": [ - 1024, - 512 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 23674880 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "8be48481c922751c9b723a99e5dcd727" + }, + { + "dataPath": "params_shard_105.bin", + "format": "raw-shard", + "nbytes": 29200384, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.mlp.fc2.weight", "shape": [ 1024, - 128 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 25772032 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.k_proj.bias", @@ -9713,29 +8314,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 26034176 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 26036224 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.k_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 26560512 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.out_proj.bias", @@ -9745,29 +8335,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 26626048 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 26628096 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.out_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 27152384 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.q_proj.bias", @@ -9777,29 +8356,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 27217920 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 27219968 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.q_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 27744256 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.v_proj.bias", @@ -9809,29 +8377,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 27809792 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 27811840 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.v_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 28336128 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.post_layernorm.bias", @@ -9841,7 +8398,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 28401664 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.post_layernorm.weight", @@ -9851,7 +8408,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 28403712 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.pre_layrnorm.bias", @@ -9861,7 +8418,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 28405760 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.pre_layrnorm.weight", @@ -9871,7 +8428,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 28407808 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_projection.linear_1.bias", @@ -9881,16 +8438,8 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 6144, - "byteOffset": 28409856 - } - ], - "md5sum": "027e3a724b350d7591cb6ed3fc9ec2a0" - }, - { - "dataPath": "params_shard_87.bin", - "format": "raw-shard", - "nbytes": 12400640, - "records": [ + "byteOffset": 16793600 + }, { "name": "vision_embed_tokens.img_projection.linear_1.q_weight", "shape": [ @@ -9900,7 +8449,7 @@ "dtype": "uint32", "format": "f32-to-bf16", "nbytes": 6291456, - "byteOffset": 0 + "byteOffset": 16799744 }, { "name": "vision_embed_tokens.img_projection.linear_1.q_scale", @@ -9911,7 +8460,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 786432, - "byteOffset": 6291456 + "byteOffset": 23091200 }, { "name": "vision_embed_tokens.img_projection.linear_2.bias", @@ -9921,7 +8470,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 6144, - "byteOffset": 7077888 + "byteOffset": 23877632 }, { "name": "vision_embed_tokens.img_projection.linear_2.q_weight", @@ -9932,7 +8481,7 @@ "dtype": "uint32", "format": "f32-to-bf16", "nbytes": 4718592, - "byteOffset": 7084032 + "byteOffset": 23883776 }, { "name": "vision_embed_tokens.img_projection.linear_2.q_scale", @@ -9943,7 +8492,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 589824, - "byteOffset": 11802624 + "byteOffset": 28602368 }, { "name": "vision_embed_tokens.sub_GN", @@ -9956,10 +8505,10 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 12392448 + "byteOffset": 29192192 } ], - "md5sum": "3ea1e6cf6a4c4b7f0a2f46b23a3d754d" + "md5sum": "927d59a5c381146b42f03e5e1f514411" } ] } \ No newline at end of file