diff --git a/mlc-chat-config.json b/mlc-chat-config.json index 3a05cbc785b8c8fade678b1d3aadf5d104f381fa..23fb1e14fef6a0dce77d7a777a890cbeda1d806a 100644 --- a/mlc-chat-config.json +++ b/mlc-chat-config.json @@ -140,15 +140,15 @@ }, "original_max_position_embeddings": 4096, "context_window_size": 131072, - "prefill_chunk_size": 2048, + "prefill_chunk_size": 8192, "head_dim": 96, "tensor_parallel_shards": 1, - "max_batch_size": 80 + "max_batch_size": 128 }, "vocab_size": 32064, "context_window_size": 131072, "sliding_window_size": -1, - "prefill_chunk_size": 2048, + "prefill_chunk_size": 8192, "attention_sink_size": -1, "tensor_parallel_shards": 1, "pipeline_parallel_stages": 1, diff --git a/ndarray-cache.json b/ndarray-cache.json index 1ee20a0cc00dd5977d515719f3f9f2c72ee48caa..5906d1b081b6b2665bd60eba3dfef767e28dda82 100644 --- a/ndarray-cache.json +++ b/ndarray-cache.json @@ -1,8 +1,8 @@ { "metadata": { - "ParamSize": 869, - "ParamBytes": 2334114368.0, - "BitsPerParam": 4.612736555784706 + "ParamSize": 724, + "ParamBytes": 2769074176.0, + "BitsPerParam": 5.4723152611665915 }, "records": [ { @@ -22,7 +22,7 @@ "byteOffset": 0 } ], - "md5sum": "03f42a0e4b7b45fb1af495013d415f70" + "md5sum": "d462bf6681cfdf3a155a33ec34995397" }, { "dataPath": "params_shard_1.bin", @@ -41,7 +41,7 @@ "byteOffset": 0 } ], - "md5sum": "c26c0bfa7471129355a632bdaceee085" + "md5sum": "44d1346cb8ecbad2a0225b6f8e6b6601" }, { "dataPath": "params_shard_2.bin", @@ -113,7 +113,7 @@ "byteOffset": 23463936 } ], - "md5sum": "c76c21adf2577acc8d5081f81635683e" + "md5sum": "d58b2bfe1a2018f50a2295a25b598203" }, { "dataPath": "params_shard_3.bin", @@ -132,7 +132,7 @@ "byteOffset": 0 } ], - "md5sum": "41e36be4010532f225910ab2da957df4" + "md5sum": "23f15d529480da9a0c42195b3916270f" }, { "dataPath": "params_shard_4.bin", @@ -215,7 +215,7 @@ "byteOffset": 33232896 } ], - "md5sum": "11fe3e24529e5d875b431ad76adbe6c6" + "md5sum": "f1e852dd01f75d353a308f918d7e042b" }, { "dataPath": "params_shard_5.bin", @@ -277,7 +277,7 @@ "byteOffset": 21233664 } ], - "md5sum": "db5de768c5c55cec34ee218899f883da" + "md5sum": "d1e46423910f8ff09fa2dea997c9df8a" }, { "dataPath": "params_shard_6.bin", @@ -296,7 +296,7 @@ "byteOffset": 0 } ], - "md5sum": "a7cf0e4fcf6869e0b96ea26b6952735a" + "md5sum": "019f500de4760aacd3ee30f87cf92f36" }, { "dataPath": "params_shard_7.bin", @@ -369,7 +369,7 @@ "byteOffset": 22026240 } ], - "md5sum": "f50a0ec8d5b4bc9f25ff5debd51c1210" + "md5sum": "0487a6f5169a8ec8731946ac438aca6f" }, { "dataPath": "params_shard_8.bin", @@ -388,7 +388,7 @@ "byteOffset": 0 } ], - "md5sum": "b3731b47d71ec2a2e1a621ce45bce622" + "md5sum": "4bd7aa0e240a5d3fe5cc4f04f0019851" }, { "dataPath": "params_shard_9.bin", @@ -471,7 +471,7 @@ "byteOffset": 33232896 } ], - "md5sum": "f4b6989d71a06160012b50345da2ab97" + "md5sum": "2d48bf11c0cfb3f138ef4e44e0bc8205" }, { "dataPath": "params_shard_10.bin", @@ -533,7 +533,7 @@ "byteOffset": 21233664 } ], - "md5sum": "c7b2fb1b7113e0d9e7ad802025d5a6fc" + "md5sum": "18c37a099b97287fa32ef12c06226d92" }, { "dataPath": "params_shard_11.bin", @@ -552,7 +552,7 @@ "byteOffset": 0 } ], - "md5sum": "dcc01e341ca10fefd9aac289c3960b97" + "md5sum": "6f715301d4fdbd2ed658ba3a86320f80" }, { "dataPath": "params_shard_12.bin", @@ -625,7 +625,7 @@ "byteOffset": 22026240 } ], - "md5sum": "8cb7f4afa1a3f347d0c443319a527b6a" + "md5sum": "f010e04f362de8344df9efd68dff17c5" }, { "dataPath": "params_shard_13.bin", @@ -644,7 +644,7 @@ "byteOffset": 0 } ], - "md5sum": "d4fe2733606e5a5c79372261fc28000f" + "md5sum": "f280ebae4a4dc4feaac07b649772118c" }, { "dataPath": "params_shard_14.bin", @@ -727,7 +727,7 @@ "byteOffset": 33232896 } ], - "md5sum": "5d76b6998116de6c8c8d5425a914df0f" + "md5sum": "d8dc46dad50b01ad80d76e32e5c4e872" }, { "dataPath": "params_shard_15.bin", @@ -789,7 +789,7 @@ "byteOffset": 21233664 } ], - "md5sum": "ef8fe2ffb42f9b91176fa4a9f11bb9de" + "md5sum": "bc99209d84c0f0887b53d173d95639dc" }, { "dataPath": "params_shard_16.bin", @@ -808,7 +808,7 @@ "byteOffset": 0 } ], - "md5sum": "9557dd078ae2cb230face8006995fcf7" + "md5sum": "f988ea3fd6c4ef0446d41f6489f8137d" }, { "dataPath": "params_shard_17.bin", @@ -881,7 +881,7 @@ "byteOffset": 22026240 } ], - "md5sum": "3baec0d24d4200875fc06af28c3fb0b8" + "md5sum": "a90dc6c7a0cd0ab22ac28efa49a37437" }, { "dataPath": "params_shard_18.bin", @@ -900,7 +900,7 @@ "byteOffset": 0 } ], - "md5sum": "65fbda0ea3fad96582fbcac92f4400fc" + "md5sum": "0367200ee6d724634eee64500b76e9f4" }, { "dataPath": "params_shard_19.bin", @@ -983,7 +983,7 @@ "byteOffset": 33232896 } ], - "md5sum": "75a0298eea85723412219cc9cb8016a4" + "md5sum": "e4e0d58bac3892d7466dc7a57d15b527" }, { "dataPath": "params_shard_20.bin", @@ -1045,7 +1045,7 @@ "byteOffset": 21233664 } ], - "md5sum": "c6b63b21d6d195d1b184b030c167b1c9" + "md5sum": "137ce81a2aef53ce819f2ddcba2662a9" }, { "dataPath": "params_shard_21.bin", @@ -1064,7 +1064,7 @@ "byteOffset": 0 } ], - "md5sum": "324d6fab6d373401073546ed03d39211" + "md5sum": "57f52a6294ba07ccfd40862302abfeb0" }, { "dataPath": "params_shard_22.bin", @@ -1137,7 +1137,7 @@ "byteOffset": 22026240 } ], - "md5sum": "8e042a2e177639cb2ff674f3a7266210" + "md5sum": "fb637e3862f096624612a89e5d550586" }, { "dataPath": "params_shard_23.bin", @@ -1156,7 +1156,7 @@ "byteOffset": 0 } ], - "md5sum": "e92a94d89f861c2c5e9d08f206b7bc1c" + "md5sum": "c4a2128471bb8163d1155d4428a3e096" }, { "dataPath": "params_shard_24.bin", @@ -1239,7 +1239,7 @@ "byteOffset": 33232896 } ], - "md5sum": "af4e357109ce0dd01c3ea75acb8aaa1a" + "md5sum": "8f46c0f65098b2f7150326e2032cad8e" }, { "dataPath": "params_shard_25.bin", @@ -1301,7 +1301,7 @@ "byteOffset": 21233664 } ], - "md5sum": "303caa4cee9e70c8bd1066464c2ea849" + "md5sum": "75acd30a2b79d831f7db532a8999a1f3" }, { "dataPath": "params_shard_26.bin", @@ -1320,7 +1320,7 @@ "byteOffset": 0 } ], - "md5sum": "70b2cf47e9e55432dd9088afd8e9a83e" + "md5sum": "8d06da6215b2c8aa873f4c228389f389" }, { "dataPath": "params_shard_27.bin", @@ -1393,7 +1393,7 @@ "byteOffset": 22026240 } ], - "md5sum": "c94a2d330f9cb37c8a61cf90deb0b45f" + "md5sum": "4f7f06d0c1fc498bcd4128e6a62b01ba" }, { "dataPath": "params_shard_28.bin", @@ -1412,7 +1412,7 @@ "byteOffset": 0 } ], - "md5sum": "b76a9a27c46ac52bddcd744b605564a9" + "md5sum": "dd4a9fc77672f3d4c5b29e3167fd4881" }, { "dataPath": "params_shard_29.bin", @@ -1495,7 +1495,7 @@ "byteOffset": 33232896 } ], - "md5sum": "fc3908ef1ff4fab5a81adf786477d8b4" + "md5sum": "86a3a85df8b0d7a1237d036a46ad6a8e" }, { "dataPath": "params_shard_30.bin", @@ -1557,7 +1557,7 @@ "byteOffset": 21233664 } ], - "md5sum": "3df7172b8ec78578295ca75338a0c32e" + "md5sum": "3f10adaed93c9b7fb821bc8b1f35659e" }, { "dataPath": "params_shard_31.bin", @@ -1576,7 +1576,7 @@ "byteOffset": 0 } ], - "md5sum": "bd5f5975f4b7f21f2554644da9da6f5a" + "md5sum": "6ddec1d838994a89efa5c5534a00f63a" }, { "dataPath": "params_shard_32.bin", @@ -1649,7 +1649,7 @@ "byteOffset": 22026240 } ], - "md5sum": "fb63daef7fca12dea591efd21b9d9c14" + "md5sum": "196b53103b396b64b908064f9984b4b7" }, { "dataPath": "params_shard_33.bin", @@ -1668,7 +1668,7 @@ "byteOffset": 0 } ], - "md5sum": "6511803dfb93c3e3ce95b0dd94e1270d" + "md5sum": "f913ba05408e86b44bc31f5a275e9cb1" }, { "dataPath": "params_shard_34.bin", @@ -1751,7 +1751,7 @@ "byteOffset": 33232896 } ], - "md5sum": "acd04c251a6a0b8a09fa648724078f9f" + "md5sum": "0ed9f2a3baa6009111345e9fd08c0fe8" }, { "dataPath": "params_shard_35.bin", @@ -1770,7 +1770,7 @@ "byteOffset": 0 } ], - "md5sum": "424943277254877ab0a7690d3839c6af" + "md5sum": "ba96aa7c1453daa5716bf285fc9e0332" }, { "dataPath": "params_shard_36.bin", @@ -1853,7 +1853,7 @@ "byteOffset": 27396096 } ], - "md5sum": "6e3c5ead604216089bb2bd02a4329a5a" + "md5sum": "956c42c6309a4a9e50ac3273a1dfe096" }, { "dataPath": "params_shard_37.bin", @@ -1872,7 +1872,7 @@ "byteOffset": 0 } ], - "md5sum": "044a1b344b2891ed7f019e9757264f23" + "md5sum": "70ec8bdbd4f6edee811b13e8382e6d31" }, { "dataPath": "params_shard_38.bin", @@ -1945,7 +1945,7 @@ "byteOffset": 22026240 } ], - "md5sum": "203e211d7b41621ac79a6cf68e143d10" + "md5sum": "30a7c74e2dabfffe2c79084684693ff9" }, { "dataPath": "params_shard_39.bin", @@ -1964,7 +1964,7 @@ "byteOffset": 0 } ], - "md5sum": "e85ef9ff37755c08ce31c1aa203216a6" + "md5sum": "19808d9fb46a8dbe89f96ef7fcbde15b" }, { "dataPath": "params_shard_40.bin", @@ -2047,7 +2047,7 @@ "byteOffset": 33232896 } ], - "md5sum": "315bdc92c799dd2d5e4f3d5f56606ab0" + "md5sum": "e9ce9615c09f57448e2ce79382a96f14" }, { "dataPath": "params_shard_41.bin", @@ -2109,7 +2109,7 @@ "byteOffset": 21233664 } ], - "md5sum": "54074992d6adab3a53bb5113104dc2a2" + "md5sum": "fc45420316ea727605be5d7e0ed8e9da" }, { "dataPath": "params_shard_42.bin", @@ -2128,7 +2128,7 @@ "byteOffset": 0 } ], - "md5sum": "583cf91ed8d73e29c53be3ba8e6b0157" + "md5sum": "7b52744731cd22ca6bf33ee27302e1e3" }, { "dataPath": "params_shard_43.bin", @@ -2201,7 +2201,7 @@ "byteOffset": 22026240 } ], - "md5sum": "6ec2356dc75920d46ae39ff75a61e327" + "md5sum": "7016666073af181d421de47db3cd2df4" }, { "dataPath": "params_shard_44.bin", @@ -2220,7 +2220,7 @@ "byteOffset": 0 } ], - "md5sum": "0c8fac4fdb901171c0687163c39bfb24" + "md5sum": "da8ffafadefa5bee6e92402a262c1591" }, { "dataPath": "params_shard_45.bin", @@ -2303,7 +2303,7 @@ "byteOffset": 33232896 } ], - "md5sum": "f04da33a046700d1fd0c52d1a748b20f" + "md5sum": "579ea893625576de7ec6c925c8e472a5" }, { "dataPath": "params_shard_46.bin", @@ -2365,7 +2365,7 @@ "byteOffset": 21233664 } ], - "md5sum": "94bce31b25ff3751bd949ee2651ff3b0" + "md5sum": "3e3a519e78b6d214c6935bf47d9fd6da" }, { "dataPath": "params_shard_47.bin", @@ -2384,7 +2384,7 @@ "byteOffset": 0 } ], - "md5sum": "deb5606d247d964e84946eb2acf96f17" + "md5sum": "01263e0f52d5530fd5dcce9d6e558faf" }, { "dataPath": "params_shard_48.bin", @@ -2457,7 +2457,7 @@ "byteOffset": 22026240 } ], - "md5sum": "147b605c605618800546ef40d9f7dfd9" + "md5sum": "df492083954171dd0f29c8347415ad4c" }, { "dataPath": "params_shard_49.bin", @@ -2476,7 +2476,7 @@ "byteOffset": 0 } ], - "md5sum": "c9e508bb9637f442a61701f39953c947" + "md5sum": "26e9da272c07b9e3164ee39204001b1a" }, { "dataPath": "params_shard_50.bin", @@ -2559,7 +2559,7 @@ "byteOffset": 33232896 } ], - "md5sum": "54e8325797a3869da3e17f7137347f37" + "md5sum": "515c4b3a001119843a14b1ebb186f53e" }, { "dataPath": "params_shard_51.bin", @@ -2621,7 +2621,7 @@ "byteOffset": 21233664 } ], - "md5sum": "d2df7b8d4d0a89dd25e2c890d09ba7ac" + "md5sum": "e852ade5c26bd91ab0fa82467a3777c6" }, { "dataPath": "params_shard_52.bin", @@ -2640,7 +2640,7 @@ "byteOffset": 0 } ], - "md5sum": "8f64903fe513470efaea44cb44882554" + "md5sum": "0adac2bada661247eab94698103f825d" }, { "dataPath": "params_shard_53.bin", @@ -2713,7 +2713,7 @@ "byteOffset": 22026240 } ], - "md5sum": "3aa4555b974bea81381743734646ac6f" + "md5sum": "4a35f0ddaaab6863a2c5a3e4a407a249" }, { "dataPath": "params_shard_54.bin", @@ -2732,7 +2732,7 @@ "byteOffset": 0 } ], - "md5sum": "9bdaa9ffa45dbeba3f15230433248a45" + "md5sum": "9c9045251d6bd64178aee3423ba02d53" }, { "dataPath": "params_shard_55.bin", @@ -2815,7 +2815,7 @@ "byteOffset": 33232896 } ], - "md5sum": "a4838335ebbe75771cf31aee80e9386b" + "md5sum": "678735984da6a7c65a985ea9bcdd9e1d" }, { "dataPath": "params_shard_56.bin", @@ -2877,7 +2877,7 @@ "byteOffset": 21233664 } ], - "md5sum": "54597a723cf21d0eef770522979d21ba" + "md5sum": "6faf93f32ebae44e2316776e943b73d5" }, { "dataPath": "params_shard_57.bin", @@ -2896,7 +2896,7 @@ "byteOffset": 0 } ], - "md5sum": "55c07771f9d95822295047a776e4e716" + "md5sum": "7c906b3f2d0a23b4b404f384ada6c863" }, { "dataPath": "params_shard_58.bin", @@ -2969,7 +2969,7 @@ "byteOffset": 22026240 } ], - "md5sum": "e292be869f50f3f22711ede0efca8e99" + "md5sum": "d5a7ef52b511ca5c6607c93718976580" }, { "dataPath": "params_shard_59.bin", @@ -2988,7 +2988,7 @@ "byteOffset": 0 } ], - "md5sum": "fc5c9bf4993163454cac074473ec84ff" + "md5sum": "7835aa22e5fc3ab43904a7ba317dd05e" }, { "dataPath": "params_shard_60.bin", @@ -3071,7 +3071,7 @@ "byteOffset": 33232896 } ], - "md5sum": "35b09aad431916ab9986914db9feaa15" + "md5sum": "97c2f05f64c9839ba60e57e830c919e6" }, { "dataPath": "params_shard_61.bin", @@ -3155,7 +3155,7 @@ "byteOffset": 26542080 } ], - "md5sum": "d612bf0a65838fe9cd7c5338b0ab2d1a" + "md5sum": "8f2cc14e740a795d3945a92bca16366a" }, { "dataPath": "params_shard_62.bin", @@ -3174,7 +3174,7 @@ "byteOffset": 0 } ], - "md5sum": "a334b0a59263051527b3959507c2059f" + "md5sum": "56f2f22839c6b77063e3a90f30122137" }, { "dataPath": "params_shard_63.bin", @@ -3247,7 +3247,7 @@ "byteOffset": 22026240 } ], - "md5sum": "ff92efa38feb0013fbeeeb24a6beb6a2" + "md5sum": "f69a2221a90921e660620770b711fd17" }, { "dataPath": "params_shard_64.bin", @@ -3266,7 +3266,7 @@ "byteOffset": 0 } ], - "md5sum": "1030ee4948f7cc79712705800b13e010" + "md5sum": "c6e8789cf22bfb7a983b1834e983dd6e" }, { "dataPath": "params_shard_65.bin", @@ -3349,7 +3349,7 @@ "byteOffset": 33232896 } ], - "md5sum": "1d2e26f38ce827dce9e614d53fbae96b" + "md5sum": "0273ecef5ee3e36de92d20e60a6091a0" }, { "dataPath": "params_shard_66.bin", @@ -3411,7 +3411,7 @@ "byteOffset": 21233664 } ], - "md5sum": "5d4f870aa25b56a966e21e557b6a5689" + "md5sum": "5026939da604c97430a95d2026bb282c" }, { "dataPath": "params_shard_67.bin", @@ -3430,7 +3430,7 @@ "byteOffset": 0 } ], - "md5sum": "b8512fae8f93fbd9f4f7f73337311990" + "md5sum": "6c825a7113de38b7e100f9e7f45fc976" }, { "dataPath": "params_shard_68.bin", @@ -3503,7 +3503,7 @@ "byteOffset": 22026240 } ], - "md5sum": "dca262e67f5875824b6cb19b77b87f2b" + "md5sum": "e8545eb30fe53e7a9809bcbc52e5edc7" }, { "dataPath": "params_shard_69.bin", @@ -3522,7 +3522,7 @@ "byteOffset": 0 } ], - "md5sum": "95e02febe339e87fd2dc66e8720d5724" + "md5sum": "1bb546cc943cea45bd5a83dca1919c16" }, { "dataPath": "params_shard_70.bin", @@ -3605,7 +3605,7 @@ "byteOffset": 33232896 } ], - "md5sum": "9ffc11f2725ba1a6a50397edb5970b7b" + "md5sum": "3c5add49f666f50d75e351c3758271f1" }, { "dataPath": "params_shard_71.bin", @@ -3667,7 +3667,7 @@ "byteOffset": 21233664 } ], - "md5sum": "b82024bf6121748baaa0b2e15f45292a" + "md5sum": "b9817824fd05540c9968991b4973535f" }, { "dataPath": "params_shard_72.bin", @@ -3686,7 +3686,7 @@ "byteOffset": 0 } ], - "md5sum": "74351377410f94f98f638d90086a3ba3" + "md5sum": "2cbf2b759939a9c467cdcd7a35ba6ce7" }, { "dataPath": "params_shard_73.bin", @@ -3759,7 +3759,7 @@ "byteOffset": 22026240 } ], - "md5sum": "8fcac7f6ef447f7857682429ee194f8c" + "md5sum": "3f972e64e6d289c178af439b37093a27" }, { "dataPath": "params_shard_74.bin", @@ -3778,7 +3778,7 @@ "byteOffset": 0 } ], - "md5sum": "92d2cc1b281e6bb28f465b49ff9b208c" + "md5sum": "a2f722107d2de12aa1644399cd04810a" }, { "dataPath": "params_shard_75.bin", @@ -3861,7 +3861,7 @@ "byteOffset": 33232896 } ], - "md5sum": "5db69c637c72f53238fa9c6f55f2d4ef" + "md5sum": "c6eaaee1e69bfad8b25eaac488987947" }, { "dataPath": "params_shard_76.bin", @@ -3923,7 +3923,7 @@ "byteOffset": 21233664 } ], - "md5sum": "18aac3937281d4613c4bebe4fef0e9f5" + "md5sum": "83155bcc2223493f6ca1afce08a7e233" }, { "dataPath": "params_shard_77.bin", @@ -3942,7 +3942,7 @@ "byteOffset": 0 } ], - "md5sum": "e6cfafe2fc17539ef7a158a9c123d35c" + "md5sum": "aa3e3bbca10469c352e931114e4352e5" }, { "dataPath": "params_shard_78.bin", @@ -4015,7 +4015,7 @@ "byteOffset": 22026240 } ], - "md5sum": "d095dac880afc3e18c3ce261f3fa747e" + "md5sum": "11036296e1ab0f3fc2aad53eea717d1d" }, { "dataPath": "params_shard_79.bin", @@ -4034,7 +4034,7 @@ "byteOffset": 0 } ], - "md5sum": "ced88ec5fc5b74c9a3131e2cbc474bc9" + "md5sum": "698469bf0d9056a98e7b4b95100337ce" }, { "dataPath": "params_shard_80.bin", @@ -4117,12 +4117,12 @@ "byteOffset": 33232896 } ], - "md5sum": "62a16d6f9c5485e7c09d371f33dd08d3" + "md5sum": "72d7706eb3e77d679c1a21db987444f9" }, { "dataPath": "params_shard_81.bin", "format": "raw-shard", - "nbytes": 32262720, + "nbytes": 32036864, "records": [ { "name": "model.h.9.mixer.out_proj.q_weight", @@ -4204,26 +4204,15 @@ "byteOffset": 21243904 }, { - "name": "vision_embed_tokens.img_processor.vision_model.embeddings.position_embedding.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.embeddings.position_embedding.weight", "shape": [ 577, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 295424, - "byteOffset": 22448128 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.embeddings.position_embedding.q_scale", - "shape": [ - 577, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 36928, - "byteOffset": 22743552 + "nbytes": 1181696, + "byteOffset": 22448128 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.layer_norm1.bias", @@ -4233,7 +4222,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 22780480 + "byteOffset": 23629824 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.layer_norm1.weight", @@ -4243,7 +4232,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 22782528 + "byteOffset": 23631872 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.layer_norm2.bias", @@ -4253,7 +4242,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 22784576 + "byteOffset": 23633920 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.layer_norm2.weight", @@ -4263,7 +4252,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 22786624 + "byteOffset": 23635968 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.mlp.fc1.bias", @@ -4273,29 +4262,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 22788672 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.mlp.fc1.q_weight", - "shape": [ - 4096, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 22796864 + "byteOffset": 23638016 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.mlp.fc1.weight", "shape": [ 4096, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 24894016 + "nbytes": 8388608, + "byteOffset": 23646208 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.mlp.fc2.bias", @@ -4305,29 +4283,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 25156160 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.mlp.fc2.q_weight", - "shape": [ - 1024, - 512 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 25158208 - }, + "byteOffset": 32034816 + } + ], + "md5sum": "06eb2520ad6b2dfb6527b035312460c8" + }, + { + "dataPath": "params_shard_82.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.mlp.fc2.weight", "shape": [ 1024, - 128 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 27255360 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.k_proj.bias", @@ -4337,29 +4312,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 27517504 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 27519552 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.k_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 28043840 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.out_proj.bias", @@ -4369,29 +4333,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 28109376 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 28111424 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.out_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 28635712 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.q_proj.bias", @@ -4401,29 +4354,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 28701248 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 28703296 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.q_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 29227584 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.v_proj.bias", @@ -4433,29 +4375,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 29293120 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 29295168 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.0.self_attn.v_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 29819456 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.layer_norm1.bias", @@ -4465,7 +4396,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 29884992 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.layer_norm1.weight", @@ -4475,7 +4406,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 29887040 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.layer_norm2.bias", @@ -4485,7 +4416,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 29889088 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.layer_norm2.weight", @@ -4495,7 +4426,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 29891136 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.mlp.fc1.bias", @@ -4505,29 +4436,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 29893184 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.mlp.fc1.q_weight", - "shape": [ - 4096, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 29901376 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.mlp.fc1.weight", "shape": [ 4096, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 31998528 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.mlp.fc2.bias", @@ -4537,37 +4457,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 32260672 + "byteOffset": 25190400 } ], - "md5sum": "f31749651cdc2e1f7cb48008e11e163a" + "md5sum": "12ccc3786467895471d31bb5b1d2610c" }, { - "dataPath": "params_shard_82.bin", + "dataPath": "params_shard_83.bin", "format": "raw-shard", - "nbytes": 33161216, + "nbytes": 25192448, "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.mlp.fc2.q_weight", - "shape": [ - 1024, - 512 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 0 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.mlp.fc2.weight", "shape": [ 1024, - 128 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 2097152 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.k_proj.bias", @@ -4577,29 +4486,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 2359296 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 2361344 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.k_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 2885632 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.out_proj.bias", @@ -4609,29 +4507,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 2951168 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 2953216 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.out_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 3477504 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.q_proj.bias", @@ -4641,29 +4528,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 3543040 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 3545088 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.q_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 4069376 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.v_proj.bias", @@ -4673,29 +4549,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 4134912 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 4136960 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.1.self_attn.v_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 4661248 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.layer_norm1.bias", @@ -4705,7 +4570,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 4726784 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.layer_norm1.weight", @@ -4715,7 +4580,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 4728832 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.layer_norm2.bias", @@ -4725,7 +4590,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 4730880 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.layer_norm2.weight", @@ -4735,7 +4600,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 4732928 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.mlp.fc1.bias", @@ -4745,29 +4610,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 4734976 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.mlp.fc1.q_weight", - "shape": [ - 4096, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 4743168 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.mlp.fc1.weight", "shape": [ 4096, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 6840320 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.mlp.fc2.bias", @@ -4777,29 +4631,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 7102464 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.mlp.fc2.q_weight", - "shape": [ - 1024, - 512 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 7104512 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "dcc2adf61aa07fe189bb15874110e845" + }, + { + "dataPath": "params_shard_84.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.mlp.fc2.weight", "shape": [ 1024, - 128 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 9201664 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.k_proj.bias", @@ -4809,29 +4660,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 9463808 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.k_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.k_proj.weight", "shape": [ 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 9465856 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.k_proj.q_scale", - "shape": [ - 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 9990144 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.out_proj.bias", @@ -4841,29 +4681,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 10055680 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 10057728 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.out_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 10582016 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.q_proj.bias", @@ -4873,29 +4702,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 10647552 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 10649600 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.q_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 11173888 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.v_proj.bias", @@ -4905,29 +4723,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 11239424 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 11241472 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.10.self_attn.v_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 11765760 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.layer_norm1.bias", @@ -4937,7 +4744,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 11831296 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.layer_norm1.weight", @@ -4947,7 +4754,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 11833344 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.layer_norm2.bias", @@ -4957,7 +4764,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 11835392 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.layer_norm2.weight", @@ -4967,7 +4774,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 11837440 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.mlp.fc1.bias", @@ -4977,29 +4784,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 11839488 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.mlp.fc1.q_weight", - "shape": [ - 4096, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 11847680 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.mlp.fc1.weight", "shape": [ 4096, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 13944832 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.mlp.fc2.bias", @@ -5009,29 +4805,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 14206976 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.mlp.fc2.q_weight", - "shape": [ - 1024, - 512 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 14209024 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "9f8d49d8894a05f4179ba707925e9d59" + }, + { + "dataPath": "params_shard_85.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.mlp.fc2.weight", "shape": [ 1024, - 128 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 16306176 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.k_proj.bias", @@ -5041,29 +4834,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 16568320 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 16570368 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.k_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 17094656 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.out_proj.bias", @@ -5073,29 +4855,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 17160192 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.out_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.out_proj.weight", "shape": [ 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 17162240 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.out_proj.q_scale", - "shape": [ - 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 17686528 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.q_proj.bias", @@ -5105,29 +4876,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 17752064 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 17754112 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.q_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 18278400 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.v_proj.bias", @@ -5137,29 +4897,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 18343936 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 18345984 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.11.self_attn.v_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 18870272 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.layer_norm1.bias", @@ -5169,7 +4918,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 18935808 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.layer_norm1.weight", @@ -5179,7 +4928,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 18937856 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.layer_norm2.bias", @@ -5189,7 +4938,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 18939904 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.layer_norm2.weight", @@ -5199,7 +4948,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 18941952 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.mlp.fc1.bias", @@ -5209,29 +4958,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 18944000 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.mlp.fc1.q_weight", - "shape": [ - 4096, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 18952192 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.mlp.fc1.weight", "shape": [ 4096, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 21049344 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.mlp.fc2.bias", @@ -5241,29 +4979,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 21311488 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.mlp.fc2.q_weight", - "shape": [ - 1024, - 512 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 21313536 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "19b6f5d2cfc839108f9156b8b521d3ce" + }, + { + "dataPath": "params_shard_86.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.mlp.fc2.weight", "shape": [ 1024, - 128 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 23410688 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.k_proj.bias", @@ -5273,29 +5008,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 23672832 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 23674880 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.k_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 24199168 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.out_proj.bias", @@ -5305,29 +5029,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 24264704 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 24266752 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.out_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 24791040 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.q_proj.bias", @@ -5337,29 +5050,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 24856576 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.q_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.q_proj.weight", "shape": [ 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 24858624 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.q_proj.q_scale", - "shape": [ - 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 25382912 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.v_proj.bias", @@ -5369,29 +5071,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 25448448 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 25450496 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.12.self_attn.v_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 25974784 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.layer_norm1.bias", @@ -5401,7 +5092,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 26040320 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.layer_norm1.weight", @@ -5411,7 +5102,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 26042368 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.layer_norm2.bias", @@ -5421,7 +5112,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 26044416 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.layer_norm2.weight", @@ -5431,7 +5122,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 26046464 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.mlp.fc1.bias", @@ -5441,29 +5132,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 26048512 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.mlp.fc1.q_weight", - "shape": [ - 4096, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 26056704 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.mlp.fc1.weight", "shape": [ 4096, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 28153856 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.mlp.fc2.bias", @@ -5473,29 +5153,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 28416000 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.mlp.fc2.q_weight", - "shape": [ - 1024, - 512 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 28418048 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "3e6322c0673873144d67964c709fa3be" + }, + { + "dataPath": "params_shard_87.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.mlp.fc2.weight", "shape": [ 1024, - 128 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 30515200 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.k_proj.bias", @@ -5505,29 +5182,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 30777344 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 30779392 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.k_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 31303680 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.out_proj.bias", @@ -5537,29 +5203,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 31369216 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 31371264 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.out_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 31895552 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.q_proj.bias", @@ -5569,29 +5224,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 31961088 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 31963136 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.q_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 32487424 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.v_proj.bias", @@ -5601,29 +5245,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 32552960 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.v_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.v_proj.weight", "shape": [ 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 32555008 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.13.self_attn.v_proj.q_scale", - "shape": [ - 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 33079296 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.layer_norm1.bias", @@ -5633,7 +5266,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 33144832 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.layer_norm1.weight", @@ -5643,7 +5276,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 33146880 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.layer_norm2.bias", @@ -5653,7 +5286,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 33148928 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.layer_norm2.weight", @@ -5663,7 +5296,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 33150976 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.mlp.fc1.bias", @@ -5673,37 +5306,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 33153024 - } - ], - "md5sum": "f08b634e46a63d50279fc8be715cd065" - }, - { - "dataPath": "params_shard_83.bin", - "format": "raw-shard", - "nbytes": 33140736, - "records": [ - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.mlp.fc1.q_weight", - "shape": [ - 4096, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 0 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.mlp.fc1.weight", "shape": [ 4096, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 2097152 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.mlp.fc2.bias", @@ -5713,29 +5327,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 2359296 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.mlp.fc2.q_weight", - "shape": [ - 1024, - 512 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 2361344 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "f04370015a40ae2073f5d89ad86f1c42" + }, + { + "dataPath": "params_shard_88.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.mlp.fc2.weight", "shape": [ 1024, - 128 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 4458496 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.k_proj.bias", @@ -5745,29 +5356,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 4720640 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 4722688 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.k_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 5246976 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.out_proj.bias", @@ -5777,29 +5377,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 5312512 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 5314560 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.out_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 5838848 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.q_proj.bias", @@ -5809,29 +5398,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 5904384 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 5906432 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.q_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 6430720 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.v_proj.bias", @@ -5841,29 +5419,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 6496256 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 6498304 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.14.self_attn.v_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 7022592 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.layer_norm1.bias", @@ -5873,7 +5440,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 7088128 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.layer_norm1.weight", @@ -5883,7 +5450,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 7090176 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.layer_norm2.bias", @@ -5893,7 +5460,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 7092224 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.layer_norm2.weight", @@ -5903,7 +5470,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 7094272 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.mlp.fc1.bias", @@ -5913,29 +5480,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 7096320 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.mlp.fc1.q_weight", - "shape": [ - 4096, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 7104512 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.mlp.fc1.weight", "shape": [ 4096, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 9201664 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.mlp.fc2.bias", @@ -5945,29 +5501,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 9463808 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.mlp.fc2.q_weight", - "shape": [ - 1024, - 512 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 9465856 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "e2c99d455ee851ede30d282481166453" + }, + { + "dataPath": "params_shard_89.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.mlp.fc2.weight", "shape": [ 1024, - 128 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 11563008 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.k_proj.bias", @@ -5977,29 +5530,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 11825152 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 11827200 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.k_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 12351488 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.out_proj.bias", @@ -6009,29 +5551,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 12417024 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 12419072 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.out_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 12943360 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.q_proj.bias", @@ -6041,29 +5572,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 13008896 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 13010944 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.q_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 13535232 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.v_proj.bias", @@ -6073,29 +5593,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 13600768 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 13602816 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.15.self_attn.v_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 14127104 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.layer_norm1.bias", @@ -6105,7 +5614,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 14192640 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.layer_norm1.weight", @@ -6115,7 +5624,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 14194688 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.layer_norm2.bias", @@ -6125,7 +5634,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 14196736 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.layer_norm2.weight", @@ -6135,7 +5644,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 14198784 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.mlp.fc1.bias", @@ -6145,29 +5654,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 14200832 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.mlp.fc1.q_weight", - "shape": [ - 4096, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 14209024 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.mlp.fc1.weight", "shape": [ 4096, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 16306176 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.mlp.fc2.bias", @@ -6177,29 +5675,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 16568320 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.mlp.fc2.q_weight", - "shape": [ - 1024, - 512 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 16570368 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "11c75f74757caccc61b9f6c3f39a9737" + }, + { + "dataPath": "params_shard_90.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.mlp.fc2.weight", "shape": [ 1024, - 128 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 18667520 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.k_proj.bias", @@ -6209,29 +5704,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 18929664 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 18931712 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.k_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 19456000 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.out_proj.bias", @@ -6241,29 +5725,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 19521536 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.out_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.out_proj.weight", "shape": [ 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 19523584 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.out_proj.q_scale", - "shape": [ - 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 20047872 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.q_proj.bias", @@ -6273,29 +5746,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 20113408 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.q_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.q_proj.weight", "shape": [ 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 20115456 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.q_proj.q_scale", - "shape": [ - 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 20639744 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.v_proj.bias", @@ -6305,29 +5767,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 20705280 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 20707328 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.16.self_attn.v_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 21231616 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.layer_norm1.bias", @@ -6337,7 +5788,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 21297152 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.layer_norm1.weight", @@ -6347,7 +5798,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 21299200 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.layer_norm2.bias", @@ -6357,7 +5808,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 21301248 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.layer_norm2.weight", @@ -6367,7 +5818,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 21303296 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.mlp.fc1.bias", @@ -6377,29 +5828,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 21305344 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.mlp.fc1.q_weight", - "shape": [ - 4096, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 21313536 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.mlp.fc1.weight", "shape": [ 4096, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 23410688 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.mlp.fc2.bias", @@ -6409,29 +5849,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 23672832 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.mlp.fc2.q_weight", - "shape": [ - 1024, - 512 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 23674880 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "a7f57fd25793b85aa6027a514efc39fb" + }, + { + "dataPath": "params_shard_91.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.mlp.fc2.weight", "shape": [ 1024, - 128 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 25772032 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.k_proj.bias", @@ -6441,29 +5878,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 26034176 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 26036224 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.k_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 26560512 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.out_proj.bias", @@ -6473,29 +5899,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 26626048 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.out_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.out_proj.weight", "shape": [ 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 26628096 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.out_proj.q_scale", - "shape": [ - 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 27152384 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.q_proj.bias", @@ -6505,29 +5920,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 27217920 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 27219968 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.q_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 27744256 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.v_proj.bias", @@ -6537,29 +5941,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 27809792 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 27811840 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.17.self_attn.v_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 28336128 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.layer_norm1.bias", @@ -6569,7 +5962,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 28401664 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.layer_norm1.weight", @@ -6579,7 +5972,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 28403712 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.layer_norm2.bias", @@ -6589,7 +5982,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 28405760 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.layer_norm2.weight", @@ -6599,7 +5992,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 28407808 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.mlp.fc1.bias", @@ -6609,29 +6002,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 28409856 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.mlp.fc1.q_weight", - "shape": [ - 4096, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 28418048 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.mlp.fc1.weight", "shape": [ 4096, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 30515200 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.mlp.fc2.bias", @@ -6641,29 +6023,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 30777344 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.mlp.fc2.q_weight", - "shape": [ - 1024, - 512 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 30779392 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "e13228942bc433e638fe3903001715f3" + }, + { + "dataPath": "params_shard_92.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.mlp.fc2.weight", "shape": [ 1024, - 128 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 32876544 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.k_proj.bias", @@ -6673,37 +6052,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 33138688 - } - ], - "md5sum": "a0e8309f607c57253603f2ffd504cce4" - }, - { - "dataPath": "params_shard_84.bin", - "format": "raw-shard", - "nbytes": 33161216, - "records": [ - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 0 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.k_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 524288 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.out_proj.bias", @@ -6713,29 +6073,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 589824 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 591872 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.out_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 1116160 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.q_proj.bias", @@ -6745,29 +6094,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 1181696 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 1183744 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.q_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 1708032 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.v_proj.bias", @@ -6777,29 +6115,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 1773568 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 1775616 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.18.self_attn.v_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 2299904 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.layer_norm1.bias", @@ -6809,7 +6136,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 2365440 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.layer_norm1.weight", @@ -6819,7 +6146,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 2367488 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.layer_norm2.bias", @@ -6829,7 +6156,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 2369536 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.layer_norm2.weight", @@ -6839,7 +6166,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 2371584 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.mlp.fc1.bias", @@ -6849,29 +6176,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 2373632 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.mlp.fc1.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.mlp.fc1.weight", "shape": [ 4096, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 2381824 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.mlp.fc1.q_scale", - "shape": [ - 4096, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 4478976 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.mlp.fc2.bias", @@ -6881,29 +6197,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 4741120 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.mlp.fc2.q_weight", - "shape": [ - 1024, - 512 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 4743168 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "eab0a6fc1a1e3beac991a0be01fdefe8" + }, + { + "dataPath": "params_shard_93.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.mlp.fc2.weight", "shape": [ 1024, - 128 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 6840320 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.k_proj.bias", @@ -6913,29 +6226,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 7102464 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.k_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.k_proj.weight", "shape": [ 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 7104512 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.k_proj.q_scale", - "shape": [ - 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 7628800 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.out_proj.bias", @@ -6945,29 +6247,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 7694336 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 7696384 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.out_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 8220672 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.q_proj.bias", @@ -6977,29 +6268,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 8286208 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.q_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.q_proj.weight", "shape": [ 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 8288256 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.q_proj.q_scale", - "shape": [ - 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 8812544 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.v_proj.bias", @@ -7009,29 +6289,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 8878080 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 8880128 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.19.self_attn.v_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 9404416 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.layer_norm1.bias", @@ -7041,7 +6310,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 9469952 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.layer_norm1.weight", @@ -7051,7 +6320,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 9472000 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.layer_norm2.bias", @@ -7061,7 +6330,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 9474048 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.layer_norm2.weight", @@ -7071,7 +6340,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 9476096 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.mlp.fc1.bias", @@ -7081,29 +6350,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 9478144 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.mlp.fc1.q_weight", - "shape": [ - 4096, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 9486336 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.mlp.fc1.weight", "shape": [ 4096, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 11583488 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.mlp.fc2.bias", @@ -7113,29 +6371,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 11845632 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.mlp.fc2.q_weight", - "shape": [ - 1024, - 512 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 11847680 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "afcfd0263f305fcc63e7b86393753bf7" + }, + { + "dataPath": "params_shard_94.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.mlp.fc2.weight", "shape": [ 1024, - 128 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 13944832 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.k_proj.bias", @@ -7145,29 +6400,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 14206976 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 14209024 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.k_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 14733312 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.out_proj.bias", @@ -7177,29 +6421,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 14798848 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 14800896 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.out_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 15325184 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.q_proj.bias", @@ -7209,29 +6442,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 15390720 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 15392768 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.q_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 15917056 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.v_proj.bias", @@ -7241,29 +6463,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 15982592 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 15984640 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.2.self_attn.v_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 16508928 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.layer_norm1.bias", @@ -7273,7 +6484,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 16574464 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.layer_norm1.weight", @@ -7283,7 +6494,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 16576512 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.layer_norm2.bias", @@ -7293,145 +6504,109 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 16578560 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.layer_norm2.weight", - "shape": [ - 1024 - ], - "dtype": "float16", - "format": "f32-to-bf16", - "nbytes": 2048, - "byteOffset": 16580608 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.mlp.fc1.bias", - "shape": [ - 4096 - ], - "dtype": "float16", - "format": "f32-to-bf16", - "nbytes": 8192, - "byteOffset": 16582656 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.mlp.fc1.q_weight", - "shape": [ - 4096, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 16590848 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.mlp.fc1.q_scale", - "shape": [ - 4096, - 32 - ], - "dtype": "float16", - "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 18688000 + "byteOffset": 16789504 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.mlp.fc2.bias", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.layer_norm2.weight", "shape": [ 1024 ], "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 18950144 + "byteOffset": 16791552 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.mlp.fc2.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.mlp.fc1.bias", "shape": [ - 1024, - 512 + 4096 ], - "dtype": "uint32", + "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 18952192 + "nbytes": 8192, + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.mlp.fc1.weight", "shape": [ - 1024, - 128 + 4096, + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 21049344 + "nbytes": 8388608, + "byteOffset": 16801792 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.k_proj.bias", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.mlp.fc2.bias", "shape": [ 1024 ], "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 21311488 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "460a8bc76edf812f85886ec9f950f395" + }, + { + "dataPath": "params_shard_95.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.k_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.mlp.fc2.weight", "shape": [ 1024, - 128 + 4096 ], - "dtype": "uint32", + "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 21313536 + "nbytes": 8388608, + "byteOffset": 0 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.k_proj.bias", "shape": [ - 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 21837824 + "nbytes": 2048, + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.out_proj.bias", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.k_proj.weight", "shape": [ + 1024, 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 2048, - "byteOffset": 21903360 + "nbytes": 2097152, + "byteOffset": 8390656 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.out_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.out_proj.bias", "shape": [ - 1024, - 128 + 1024 ], - "dtype": "uint32", + "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 21905408 + "nbytes": 2048, + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.out_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 22429696 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.q_proj.bias", @@ -7441,29 +6616,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 22495232 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 22497280 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.q_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 23021568 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.v_proj.bias", @@ -7473,29 +6637,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 23087104 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 23089152 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.20.self_attn.v_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 23613440 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.layer_norm1.bias", @@ -7505,7 +6658,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 23678976 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.layer_norm1.weight", @@ -7515,7 +6668,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 23681024 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.layer_norm2.bias", @@ -7525,7 +6678,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 23683072 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.layer_norm2.weight", @@ -7535,7 +6688,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 23685120 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.mlp.fc1.bias", @@ -7545,29 +6698,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 23687168 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.mlp.fc1.q_weight", - "shape": [ - 4096, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 23695360 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.mlp.fc1.weight", "shape": [ 4096, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 25792512 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.mlp.fc2.bias", @@ -7577,29 +6719,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 26054656 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.mlp.fc2.q_weight", - "shape": [ - 1024, - 512 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 26056704 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "bcac984764bba0a4eb9891d2043e1d89" + }, + { + "dataPath": "params_shard_96.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.mlp.fc2.weight", "shape": [ 1024, - 128 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 28153856 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.k_proj.bias", @@ -7609,29 +6748,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 28416000 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 28418048 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.k_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 28942336 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.out_proj.bias", @@ -7641,29 +6769,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 29007872 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 29009920 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.out_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 29534208 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.q_proj.bias", @@ -7673,29 +6790,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 29599744 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 29601792 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.q_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 30126080 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.v_proj.bias", @@ -7705,29 +6811,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 30191616 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 30193664 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.21.self_attn.v_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 30717952 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.layer_norm1.bias", @@ -7737,7 +6832,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 30783488 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.layer_norm1.weight", @@ -7747,7 +6842,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 30785536 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.layer_norm2.bias", @@ -7757,7 +6852,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 30787584 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.layer_norm2.weight", @@ -7767,7 +6862,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 30789632 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.mlp.fc1.bias", @@ -7777,29 +6872,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 30791680 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.mlp.fc1.q_weight", - "shape": [ - 4096, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 30799872 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.mlp.fc1.weight", "shape": [ 4096, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 32897024 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.mlp.fc2.bias", @@ -7809,37 +6893,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 33159168 + "byteOffset": 25190400 } ], - "md5sum": "10ad505e9ab90b00640b5382d9bb5582" + "md5sum": "3197e582d745d84c2ab4347a1f2d4e2d" }, { - "dataPath": "params_shard_85.bin", + "dataPath": "params_shard_97.bin", "format": "raw-shard", - "nbytes": 33161216, + "nbytes": 25192448, "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.mlp.fc2.q_weight", - "shape": [ - 1024, - 512 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 0 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.mlp.fc2.weight", "shape": [ 1024, - 128 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 2097152 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.k_proj.bias", @@ -7849,29 +6922,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 2359296 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 2361344 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.k_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 2885632 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.out_proj.bias", @@ -7881,29 +6943,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 2951168 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 2953216 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.out_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 3477504 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.q_proj.bias", @@ -7913,29 +6964,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 3543040 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 3545088 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.q_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 4069376 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.v_proj.bias", @@ -7945,29 +6985,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 4134912 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 4136960 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.22.self_attn.v_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 4661248 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.layer_norm1.bias", @@ -7977,7 +7006,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 4726784 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.layer_norm1.weight", @@ -7987,7 +7016,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 4728832 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.layer_norm2.bias", @@ -7997,7 +7026,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 4730880 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.layer_norm2.weight", @@ -8007,7 +7036,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 4732928 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.mlp.fc1.bias", @@ -8017,29 +7046,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 4734976 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.mlp.fc1.q_weight", - "shape": [ - 4096, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 4743168 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.mlp.fc1.weight", "shape": [ 4096, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 6840320 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.mlp.fc2.bias", @@ -8049,29 +7067,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 7102464 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.mlp.fc2.q_weight", - "shape": [ - 1024, - 512 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 7104512 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "e6d67ae9f4dab5ea49fac79bceac7a86" + }, + { + "dataPath": "params_shard_98.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.mlp.fc2.weight", "shape": [ 1024, - 128 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 9201664 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.k_proj.bias", @@ -8081,29 +7096,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 9463808 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 9465856 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.k_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 9990144 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.out_proj.bias", @@ -8113,29 +7117,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 10055680 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 10057728 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.out_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 10582016 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.q_proj.bias", @@ -8144,30 +7137,19 @@ ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 2048, - "byteOffset": 10647552 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 10649600 + "nbytes": 2048, + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.q_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 11173888 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.v_proj.bias", @@ -8177,29 +7159,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 11239424 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 11241472 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.23.self_attn.v_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 11765760 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.layer_norm1.bias", @@ -8209,7 +7180,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 11831296 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.layer_norm1.weight", @@ -8219,7 +7190,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 11833344 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.layer_norm2.bias", @@ -8229,7 +7200,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 11835392 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.layer_norm2.weight", @@ -8239,7 +7210,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 11837440 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.mlp.fc1.bias", @@ -8249,29 +7220,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 11839488 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.mlp.fc1.q_weight", - "shape": [ - 4096, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 11847680 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.mlp.fc1.weight", "shape": [ 4096, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 13944832 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.mlp.fc2.bias", @@ -8281,29 +7241,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 14206976 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.mlp.fc2.q_weight", - "shape": [ - 1024, - 512 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 14209024 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "1a74510bf14d6fc06b53f09ee6a22fdd" + }, + { + "dataPath": "params_shard_99.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.mlp.fc2.weight", "shape": [ 1024, - 128 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 16306176 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.k_proj.bias", @@ -8313,29 +7270,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 16568320 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 16570368 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.k_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 17094656 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.out_proj.bias", @@ -8345,29 +7291,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 17160192 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 17162240 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.out_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 17686528 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.q_proj.bias", @@ -8377,29 +7312,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 17752064 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 17754112 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.q_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 18278400 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.v_proj.bias", @@ -8409,29 +7333,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 18343936 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 18345984 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.3.self_attn.v_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 18870272 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.layer_norm1.bias", @@ -8441,7 +7354,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 18935808 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.layer_norm1.weight", @@ -8451,7 +7364,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 18937856 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.layer_norm2.bias", @@ -8461,7 +7374,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 18939904 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.layer_norm2.weight", @@ -8471,7 +7384,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 18941952 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.mlp.fc1.bias", @@ -8481,29 +7394,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 18944000 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.mlp.fc1.q_weight", - "shape": [ - 4096, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 18952192 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.mlp.fc1.weight", "shape": [ 4096, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 21049344 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.mlp.fc2.bias", @@ -8513,29 +7415,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 21311488 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.mlp.fc2.q_weight", - "shape": [ - 1024, - 512 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 21313536 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "75a9ee23e852e5562e2176a5ece04f24" + }, + { + "dataPath": "params_shard_100.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.mlp.fc2.weight", "shape": [ 1024, - 128 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 23410688 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.k_proj.bias", @@ -8545,29 +7444,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 23672832 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 23674880 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.k_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 24199168 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.out_proj.bias", @@ -8577,29 +7465,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 24264704 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 24266752 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.out_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 24791040 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.q_proj.bias", @@ -8609,29 +7486,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 24856576 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 24858624 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.q_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 25382912 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.v_proj.bias", @@ -8641,29 +7507,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 25448448 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 25450496 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.4.self_attn.v_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 25974784 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.layer_norm1.bias", @@ -8673,7 +7528,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 26040320 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.layer_norm1.weight", @@ -8683,7 +7538,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 26042368 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.layer_norm2.bias", @@ -8693,7 +7548,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 26044416 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.layer_norm2.weight", @@ -8703,7 +7558,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 26046464 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.mlp.fc1.bias", @@ -8713,29 +7568,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 26048512 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.mlp.fc1.q_weight", - "shape": [ - 4096, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 26056704 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.mlp.fc1.weight", "shape": [ 4096, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 28153856 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.mlp.fc2.bias", @@ -8745,29 +7589,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 28416000 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.mlp.fc2.q_weight", - "shape": [ - 1024, - 512 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 28418048 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "da3f4d64dad38aa57a47fd6fbca1a334" + }, + { + "dataPath": "params_shard_101.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.mlp.fc2.weight", "shape": [ 1024, - 128 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 30515200 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.k_proj.bias", @@ -8777,29 +7618,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 30777344 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 30779392 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.k_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 31303680 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.out_proj.bias", @@ -8809,29 +7639,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 31369216 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 31371264 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.out_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 31895552 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.q_proj.bias", @@ -8841,29 +7660,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 31961088 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 31963136 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.q_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 32487424 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.v_proj.bias", @@ -8873,29 +7681,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 32552960 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 32555008 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.5.self_attn.v_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 33079296 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.layer_norm1.bias", @@ -8905,7 +7702,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 33144832 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.layer_norm1.weight", @@ -8915,7 +7712,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 33146880 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.layer_norm2.bias", @@ -8925,7 +7722,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 33148928 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.layer_norm2.weight", @@ -8935,7 +7732,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 33150976 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.mlp.fc1.bias", @@ -8945,37 +7742,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 33153024 - } - ], - "md5sum": "16f33cc460696f29368f48352e15c0cb" - }, - { - "dataPath": "params_shard_86.bin", - "format": "raw-shard", - "nbytes": 28416000, - "records": [ - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.mlp.fc1.q_weight", - "shape": [ - 4096, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 0 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.mlp.fc1.weight", "shape": [ 4096, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 2097152 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.mlp.fc2.bias", @@ -8985,29 +7763,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 2359296 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.mlp.fc2.q_weight", - "shape": [ - 1024, - 512 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 2361344 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "ca1eb7481171d37cc9fab4b3432d81d1" + }, + { + "dataPath": "params_shard_102.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.mlp.fc2.weight", "shape": [ 1024, - 128 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 4458496 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.k_proj.bias", @@ -9017,29 +7792,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 4720640 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.k_proj.q_weight", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.k_proj.weight", "shape": [ 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 4722688 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.k_proj.q_scale", - "shape": [ - 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 5246976 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.out_proj.bias", @@ -9049,29 +7813,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 5312512 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 5314560 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.out_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 5838848 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.q_proj.bias", @@ -9081,29 +7834,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 5904384 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 5906432 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.q_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 6430720 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.v_proj.bias", @@ -9113,29 +7855,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 6496256 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 6498304 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.6.self_attn.v_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 7022592 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.layer_norm1.bias", @@ -9145,7 +7876,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 7088128 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.layer_norm1.weight", @@ -9155,7 +7886,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 7090176 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.layer_norm2.bias", @@ -9165,7 +7896,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 7092224 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.layer_norm2.weight", @@ -9175,7 +7906,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 7094272 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.mlp.fc1.bias", @@ -9185,29 +7916,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 7096320 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.mlp.fc1.q_weight", - "shape": [ - 4096, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 7104512 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.mlp.fc1.weight", "shape": [ 4096, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 9201664 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.mlp.fc2.bias", @@ -9217,29 +7937,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 9463808 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.mlp.fc2.q_weight", - "shape": [ - 1024, - 512 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 9465856 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "03be4317a6855a15625866d5dde56763" + }, + { + "dataPath": "params_shard_103.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.mlp.fc2.weight", "shape": [ 1024, - 128 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 11563008 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.k_proj.bias", @@ -9249,29 +7966,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 11825152 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 11827200 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.k_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 12351488 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.out_proj.bias", @@ -9281,29 +7987,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 12417024 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 12419072 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.out_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 12943360 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.q_proj.bias", @@ -9313,29 +8008,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 13008896 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 13010944 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.q_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 13535232 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.v_proj.bias", @@ -9345,29 +8029,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 13600768 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 13602816 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.7.self_attn.v_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 14127104 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.layer_norm1.bias", @@ -9377,7 +8050,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 14192640 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.layer_norm1.weight", @@ -9387,7 +8060,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 14194688 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.layer_norm2.bias", @@ -9397,7 +8070,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 14196736 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.layer_norm2.weight", @@ -9407,7 +8080,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 14198784 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.mlp.fc1.bias", @@ -9417,29 +8090,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 14200832 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.mlp.fc1.q_weight", - "shape": [ - 4096, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 14209024 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.mlp.fc1.weight", "shape": [ 4096, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 16306176 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.mlp.fc2.bias", @@ -9449,29 +8111,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 16568320 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.mlp.fc2.q_weight", - "shape": [ - 1024, - 512 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 16570368 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "7464cccd529310def6e3920c637ad62c" + }, + { + "dataPath": "params_shard_104.bin", + "format": "raw-shard", + "nbytes": 25192448, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.mlp.fc2.weight", "shape": [ 1024, - 128 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 18667520 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.k_proj.bias", @@ -9481,29 +8140,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 18929664 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 18931712 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.k_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 19456000 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.out_proj.bias", @@ -9513,29 +8161,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 19521536 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 19523584 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.out_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 20047872 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.q_proj.bias", @@ -9545,29 +8182,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 20113408 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 20115456 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.q_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 20639744 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.v_proj.bias", @@ -9577,29 +8203,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 20705280 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 20707328 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.8.self_attn.v_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 21231616 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.layer_norm1.bias", @@ -9609,7 +8224,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 21297152 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.layer_norm1.weight", @@ -9619,7 +8234,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 21299200 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.layer_norm2.bias", @@ -9629,7 +8244,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 21301248 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.layer_norm2.weight", @@ -9639,7 +8254,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 21303296 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.mlp.fc1.bias", @@ -9649,29 +8264,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 21305344 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.mlp.fc1.q_weight", - "shape": [ - 4096, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 21313536 + "byteOffset": 16793600 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.mlp.fc1.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.mlp.fc1.weight", "shape": [ 4096, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 23410688 + "nbytes": 8388608, + "byteOffset": 16801792 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.mlp.fc2.bias", @@ -9681,29 +8285,26 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 23672832 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.mlp.fc2.q_weight", - "shape": [ - 1024, - 512 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 2097152, - "byteOffset": 23674880 - }, + "byteOffset": 25190400 + } + ], + "md5sum": "8be48481c922751c9b723a99e5dcd727" + }, + { + "dataPath": "params_shard_105.bin", + "format": "raw-shard", + "nbytes": 29200384, + "records": [ { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.mlp.fc2.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.mlp.fc2.weight", "shape": [ 1024, - 128 + 4096 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 262144, - "byteOffset": 25772032 + "nbytes": 8388608, + "byteOffset": 0 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.k_proj.bias", @@ -9713,29 +8314,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 26034176 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.k_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 26036224 + "byteOffset": 8388608 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.k_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.k_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 26560512 + "nbytes": 2097152, + "byteOffset": 8390656 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.out_proj.bias", @@ -9745,29 +8335,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 26626048 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.out_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 26628096 + "byteOffset": 10487808 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.out_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.out_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 27152384 + "nbytes": 2097152, + "byteOffset": 10489856 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.q_proj.bias", @@ -9777,29 +8356,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 27217920 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.q_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 27219968 + "byteOffset": 12587008 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.q_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.q_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 27744256 + "nbytes": 2097152, + "byteOffset": 12589056 }, { "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.v_proj.bias", @@ -9809,29 +8377,18 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 27809792 - }, - { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.v_proj.q_weight", - "shape": [ - 1024, - 128 - ], - "dtype": "uint32", - "format": "f32-to-bf16", - "nbytes": 524288, - "byteOffset": 27811840 + "byteOffset": 14686208 }, { - "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.v_proj.q_scale", + "name": "vision_embed_tokens.img_processor.vision_model.encoder.layers.9.self_attn.v_proj.weight", "shape": [ 1024, - 32 + 1024 ], "dtype": "float16", "format": "f32-to-bf16", - "nbytes": 65536, - "byteOffset": 28336128 + "nbytes": 2097152, + "byteOffset": 14688256 }, { "name": "vision_embed_tokens.img_processor.vision_model.post_layernorm.bias", @@ -9841,7 +8398,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 28401664 + "byteOffset": 16785408 }, { "name": "vision_embed_tokens.img_processor.vision_model.post_layernorm.weight", @@ -9851,7 +8408,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 28403712 + "byteOffset": 16787456 }, { "name": "vision_embed_tokens.img_processor.vision_model.pre_layrnorm.bias", @@ -9861,7 +8418,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 28405760 + "byteOffset": 16789504 }, { "name": "vision_embed_tokens.img_processor.vision_model.pre_layrnorm.weight", @@ -9871,7 +8428,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 2048, - "byteOffset": 28407808 + "byteOffset": 16791552 }, { "name": "vision_embed_tokens.img_projection.linear_1.bias", @@ -9881,16 +8438,8 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 6144, - "byteOffset": 28409856 - } - ], - "md5sum": "027e3a724b350d7591cb6ed3fc9ec2a0" - }, - { - "dataPath": "params_shard_87.bin", - "format": "raw-shard", - "nbytes": 12400640, - "records": [ + "byteOffset": 16793600 + }, { "name": "vision_embed_tokens.img_projection.linear_1.q_weight", "shape": [ @@ -9900,7 +8449,7 @@ "dtype": "uint32", "format": "f32-to-bf16", "nbytes": 6291456, - "byteOffset": 0 + "byteOffset": 16799744 }, { "name": "vision_embed_tokens.img_projection.linear_1.q_scale", @@ -9911,7 +8460,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 786432, - "byteOffset": 6291456 + "byteOffset": 23091200 }, { "name": "vision_embed_tokens.img_projection.linear_2.bias", @@ -9921,7 +8470,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 6144, - "byteOffset": 7077888 + "byteOffset": 23877632 }, { "name": "vision_embed_tokens.img_projection.linear_2.q_weight", @@ -9932,7 +8481,7 @@ "dtype": "uint32", "format": "f32-to-bf16", "nbytes": 4718592, - "byteOffset": 7084032 + "byteOffset": 23883776 }, { "name": "vision_embed_tokens.img_projection.linear_2.q_scale", @@ -9943,7 +8492,7 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 589824, - "byteOffset": 11802624 + "byteOffset": 28602368 }, { "name": "vision_embed_tokens.sub_GN", @@ -9956,10 +8505,10 @@ "dtype": "float16", "format": "f32-to-bf16", "nbytes": 8192, - "byteOffset": 12392448 + "byteOffset": 29192192 } ], - "md5sum": "3ea1e6cf6a4c4b7f0a2f46b23a3d754d" + "md5sum": "927d59a5c381146b42f03e5e1f514411" } ] } \ No newline at end of file diff --git a/params_shard_0.bin b/params_shard_0.bin index 3da8dcd2b619ad2c7b461dc1c9ff6e765b034476..8c07c655f2214d74c22925e85c5f38c0ba85f026 100644 --- a/params_shard_0.bin +++ b/params_shard_0.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ac9d4fbf615ae8e355c12f627886bd845dd551ef3968b47f7f5368aada266769 +oid sha256:81297aec4fcde9f701f1aa5c602edca6e417e86d70e563d4b543810030bf5f8d size 49250304 diff --git a/params_shard_1.bin b/params_shard_1.bin index 559b4ecd77c9d1766d67f6962c7966507013fb22..57df0056affc870f76d9b59488e02cf08cea5d3a 100644 --- a/params_shard_1.bin +++ b/params_shard_1.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:649dad831d5eb1b619d66f0be2d2c6fa0db928daecf5559469b09681e7c3e479 +oid sha256:4cb3be86e95443540e1bbb74f85f9ebf193bce0cf65b64e44d51922950753b9f size 25165824 diff --git a/params_shard_10.bin b/params_shard_10.bin index 6f2dfc62d551ea181b7b8e0880f1a235e4b5de6b..298dcf8dad74c6470875e635c08ce0a7f8e7388e 100644 --- a/params_shard_10.bin +++ b/params_shard_10.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1138f3d3f182336adb21ae04536dd3862ad23782b18a53e76efe16d54e8d6131 +oid sha256:2d5576605b34ab95fc447c0e5b1c0a5af977eae8b76e9996b950eb450fc862d1 size 21239808 diff --git a/params_shard_100.bin b/params_shard_100.bin new file mode 100644 index 0000000000000000000000000000000000000000..0991ac96fad5c0df60e3f6664835fe3664ff927a --- /dev/null +++ b/params_shard_100.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f29ef3fcc9ba8c66b7d85750451a1066cad22142876e0b0ad1dad6d6d626734 +size 25192448 diff --git a/params_shard_101.bin b/params_shard_101.bin new file mode 100644 index 0000000000000000000000000000000000000000..cb8e8e71915ea867c4d1b5c75ca4c598dbc627ae --- /dev/null +++ b/params_shard_101.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3cb80fac56fa63595d204122751bc048a218f552b3525ee8666e3d5a1a5bb61 +size 25192448 diff --git a/params_shard_102.bin b/params_shard_102.bin new file mode 100644 index 0000000000000000000000000000000000000000..955e937d196645c5763bcf8104e57f28284125d5 --- /dev/null +++ b/params_shard_102.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15fe6e0782e6c7fcc2608a620bd532df2c01948210a0ae29a78fd26e08cc8848 +size 25192448 diff --git a/params_shard_103.bin b/params_shard_103.bin new file mode 100644 index 0000000000000000000000000000000000000000..7919c7b9829e1cecca0a8e5eb0e7e524e13c0cc8 --- /dev/null +++ b/params_shard_103.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3a6b054e2b0fa6fac22c84b14f9e8e20095648e7fdf00f9659ade781f7e53c2 +size 25192448 diff --git a/params_shard_104.bin b/params_shard_104.bin new file mode 100644 index 0000000000000000000000000000000000000000..4af783852328cc823db7ae61b6d2b62d2c94e322 --- /dev/null +++ b/params_shard_104.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47d578479f438d9a57c130ecabbe1bae0bd7cdf78a9b875fd105cdfdca5322f5 +size 25192448 diff --git a/params_shard_105.bin b/params_shard_105.bin new file mode 100644 index 0000000000000000000000000000000000000000..470e7982e379ff7da37ffcaa2285c48f77318780 --- /dev/null +++ b/params_shard_105.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:654e8815613bba5cae2733c2845f3c169e14c122f621e5341dac054f4ff5eba0 +size 29200384 diff --git a/params_shard_11.bin b/params_shard_11.bin index a1e7b39f9546b53b302550e6be29a155840f63a3..4b4aa7e7c1df7bdea0b72bba5e635fd861016d20 100644 --- a/params_shard_11.bin +++ b/params_shard_11.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9076409be6cc7ace8ca1239f358b876a2d1185995ba937f78ca08b25e8303ea6 +oid sha256:bda0912e2f1d3d5d8af249a6ab48e7844283223aec2c8742fbce3e7b64e07d83 size 25165824 diff --git a/params_shard_12.bin b/params_shard_12.bin index 21a9dfbc3cd3bf67f37f7af031f8b53c2460c511..d36136089bb3afa1f1a7f2347d7fc9bacde165e9 100644 --- a/params_shard_12.bin +++ b/params_shard_12.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3e6aa688763da3039141419e4ba4d6f37576be934f2fd45777d66599a3759670 +oid sha256:b2a04ed984360df1c110d15213ccd686e1a1be314bc3842df30821c12b094109 size 22616064 diff --git a/params_shard_13.bin b/params_shard_13.bin index c21a3a078218cfc5cd324297cc9c59ebb7863abe..ed0d393fc1895e34f25d7358a2d4b87d4cdded25 100644 --- a/params_shard_13.bin +++ b/params_shard_13.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:861f0c3278c34f1698d3fa6430e551a692c117cf0dcaf41f198fcab3c7f3e926 +oid sha256:a00b92fbcfe5e4f75eeb94dde8308162832c8613a319d2b75605c03f753cf6c3 size 25165824 diff --git a/params_shard_14.bin b/params_shard_14.bin index caf5fe0f8bf2dc5233880a05dc1696cba0abf107..5524ee3def343cf23709beadc55a46b2ba6fd067 100644 --- a/params_shard_14.bin +++ b/params_shard_14.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:91651114963a1fa9bd933b76262dbc0f6d8b496d403e1b8671965efd4ff308b0 +oid sha256:455b82cea27e0d4486b8bb2dd147b78ad6174ad28d85f714b551043f5d1e8a24 size 33239040 diff --git a/params_shard_15.bin b/params_shard_15.bin index fbdb35ccab2524bebe3723996d51e713c0f4c549..91bf2a93d89030b7e70ff6ae1c98745f507d32c5 100644 --- a/params_shard_15.bin +++ b/params_shard_15.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e47a30e0c35476945432b23d17066013be5a6a4210bb77406fcf86ab4b00ede9 +oid sha256:2a890edcc59e43538c5c88f1e1dc923e57ccd9d28d412a15ef69315cd0e26af6 size 21239808 diff --git a/params_shard_16.bin b/params_shard_16.bin index 38df10ae38dadcc51837e13f1093f853d10fa8e3..f8efe6b99bef79909d6dc04d1011a0c805d34092 100644 --- a/params_shard_16.bin +++ b/params_shard_16.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5f87222b64a6dcabd4eb0066ddbdc79da701e6172687de894fd491ebc252f8de +oid sha256:fb4514df14bb8853862923c9b95eb3771ea42f4294adc0c08ce041c8ba849391 size 25165824 diff --git a/params_shard_17.bin b/params_shard_17.bin index 8036cf19b90fa670b5713828b80bf1cf5db2ee8b..7ff36bd754ebb8c0888ddf12c34336db1b56f458 100644 --- a/params_shard_17.bin +++ b/params_shard_17.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8a4cd0ea23f069ef0285af7108341e7462de29aa54913467e59b3067ff9c2779 +oid sha256:f2d9bb5532b42ec66293d46b8bcd8798439fc8b3fafafdad47a30d2d3dff3397 size 22616064 diff --git a/params_shard_18.bin b/params_shard_18.bin index dc6bb1dfa3f5631ec7ebe2bcf82277a36576be80..8c36fa200b780aa15bf829fc1c416b04ece27e37 100644 --- a/params_shard_18.bin +++ b/params_shard_18.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:92f9c5816d332063c69ea5befcce556117582ce253af9f759225b1b65a93a611 +oid sha256:14e6ff5e2d2e8c0b69bbc6a673b7fc59e5f5aaae964065cc80cb96b531ea914e size 25165824 diff --git a/params_shard_19.bin b/params_shard_19.bin index 81b031558345bba661ebd8d25ccf9c734af6f1d0..a0672252f32c9369d73b9d2ed846c89a37a9034f 100644 --- a/params_shard_19.bin +++ b/params_shard_19.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:eaab1018bcdecdbf93e5e9b13521951c434d224aab0f296400b1c6c1a1c1b363 +oid sha256:5c2ca06b4a15722a6cddf4146396996d8e32611391d116c8a000fd3b843eeefc size 33239040 diff --git a/params_shard_2.bin b/params_shard_2.bin index f11ae4d66aa1b488507e1926f5401fdacee4e0e7..8a2c4dd73b1a0381902df00cef28d2cf871e3073 100644 --- a/params_shard_2.bin +++ b/params_shard_2.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ad54f4f9adaf44aa5848b8cf93b42bdb14589db13d43299f7afbc28610fadfc6 +oid sha256:d770157dfa010ff5b87c86f87fc3c4d113b535539417b7f3959e5c9673be7df4 size 23470080 diff --git a/params_shard_20.bin b/params_shard_20.bin index 7a4e4c516eccba693347b8fb6e3e8955ad45034f..a339ee592ec4dd13890fb673abe94a7fa922ca8e 100644 --- a/params_shard_20.bin +++ b/params_shard_20.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ddbaf4759b2b4521414923a597375d28cef8b153600e103ce3440b7b32a3792f +oid sha256:bf1be0521235bbefb1f8184fe8f26af1d1c58e43cdd0379cbb2cd4ec2d329493 size 21239808 diff --git a/params_shard_21.bin b/params_shard_21.bin index 1a10170011d9ed8e33699b2c9770816b23438cf9..32bd16b3e99e7a0ba4f51f3020a0c8e241785623 100644 --- a/params_shard_21.bin +++ b/params_shard_21.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:97e1a3996663d9e99f97028da08367fb0e64a42e222dcc7fd4a9170bd981c035 +oid sha256:64e6ae6c4299a675e5511d199600cea3db33dac30b97036b33abdabb7dd955b9 size 25165824 diff --git a/params_shard_22.bin b/params_shard_22.bin index c1588944ade293a2e9c36d0a7027fb50c7cd7245..17d77c3ec60269b3eced0f1b4bfc6f91d034ba21 100644 --- a/params_shard_22.bin +++ b/params_shard_22.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:edc0143daf0ea288850e89161342b8278a315eae76792e2a6c8c770a7389b778 +oid sha256:b143e78d1c127fc9eba2ac9da2453153e1a7faf330b93f7f502fb72858b453c0 size 22616064 diff --git a/params_shard_23.bin b/params_shard_23.bin index 34d7417053b07048b550003859651c280e75a72a..137a083d60dc51b91a8263ce21fd811250297f9f 100644 --- a/params_shard_23.bin +++ b/params_shard_23.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7ec93c3d9b53859fbd41e9fe551fd4b453858850614e48429e97a2906e2c7def +oid sha256:fadc302e1ae4811fccbf7a080fffd2d21dd415141e18071bc29025dec9f81f82 size 25165824 diff --git a/params_shard_24.bin b/params_shard_24.bin index 77d20a10d162053834687e948631a7d9e2835dee..875abca4285531c5e6f63c45557e7924fa952e2e 100644 --- a/params_shard_24.bin +++ b/params_shard_24.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:82ea240a2a3854cf6285954e90d17f0062571419564f5525c67a641dbb1167de +oid sha256:1475c34e6bf00faebe1fc6781f9ecf2f97e603e03b1c123a9a304d0b916ac6ab size 33239040 diff --git a/params_shard_25.bin b/params_shard_25.bin index 66e4d9b89fd5426e985ba946506292d2edfa8497..d6e948ff7845e060c8dd048cdacc0fff8de04573 100644 --- a/params_shard_25.bin +++ b/params_shard_25.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5a8e163d4da357c46e99839f7000d7d42d6cb62da56a6a8c44f7c5b485daa94c +oid sha256:22f6e0f02a12b29f2ac2ab8ee6c5bfd2127d74bc47ce39d2c9291e2a8b4bf1d7 size 21239808 diff --git a/params_shard_26.bin b/params_shard_26.bin index 52f015f76b53571fd90ac7bb65d86c9e7e9fbec5..065d643726fee81ee5ad372ef07399a97da58fa5 100644 --- a/params_shard_26.bin +++ b/params_shard_26.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ec9ac1c558779c7205169e9a7f2e707b4b69d6f95783e5825ac1648efed86c05 +oid sha256:fcdeb372a63465619f978504a1f117232b310490b35f2a39091d026297e75209 size 25165824 diff --git a/params_shard_27.bin b/params_shard_27.bin index 8a63072e7969455e08d6d34112fb9fceeca17553..b964f9f762bbf5ee60539d0fac7319a3e53723aa 100644 --- a/params_shard_27.bin +++ b/params_shard_27.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c01edb67a24f05dffa49b4d1f4e99a0daf959af979f4a9d96de59f9898683b51 +oid sha256:bd9a8fbf49f3ba652d63c42477f09aee5642721cf04d211bf1e19bce53585b53 size 22616064 diff --git a/params_shard_28.bin b/params_shard_28.bin index adf350d5f8f63a798d96a6b5cf1d232f26ddb1b7..10638cf5f54a322bcf044eb7e13a67e089363bbc 100644 --- a/params_shard_28.bin +++ b/params_shard_28.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:de7c43ac1d3a4ebf1f586e9ae2274d9dd392bb31a8281bc54c10968a21364976 +oid sha256:7d5c3107d6faea1f075ccebb8d6775633b60ba9878e8aa942b794164b046e848 size 25165824 diff --git a/params_shard_29.bin b/params_shard_29.bin index 35e17a220b52fddf598d13be8f25beefe7114238..89e75e337a3f774d9524cbeb2765043387bce730 100644 --- a/params_shard_29.bin +++ b/params_shard_29.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2f81f1c8143ba45885268ba9c1013ccea18c6c490e447d5a9d8d57b60a7ff9cb +oid sha256:711d12ebeb1e5c9b9bd2d5ad1b03b7afe23596e7ea420ccd8770844c45c1c81e size 33239040 diff --git a/params_shard_3.bin b/params_shard_3.bin index be62af73ea2a0e34b61b81577815ae56d97e0633..a9e87023f2077b12042fab5bdac700996c7d4995 100644 --- a/params_shard_3.bin +++ b/params_shard_3.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:aab2f1af66c00cd96189b0e96882df72a9f2b46f0b0371271a205d13a8285fb3 +oid sha256:3dba1d1e8c1ef52483cf1918128b24c21d47d1ecb7df76e776e284d8207118bf size 25165824 diff --git a/params_shard_30.bin b/params_shard_30.bin index 132f4865d696266af7828c8678a4711633b960c0..a91903376efddd450f18185523df3ceeb17f7b2e 100644 --- a/params_shard_30.bin +++ b/params_shard_30.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0914106ba25c70592431cec055100d4f2b78f5dcb51827c257a60506d3580a0b +oid sha256:9c2497c7ab3b54273e3ede4914b8e1824dfea1654c9f38303bc9d6cdc5838b3c size 21239808 diff --git a/params_shard_31.bin b/params_shard_31.bin index a8a20e2f6eb9f1e02c3d0f74010b762c1692516f..11fbf78cc3b6cf04f68ac83fe2ef71e57d01ae62 100644 --- a/params_shard_31.bin +++ b/params_shard_31.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:65799beb75bcff7785468d67aac61cbef5e3d879fbdbe9c61f4874f31e72db95 +oid sha256:041d1acaf61a8a9d7a63d65676d08b6c553554b2fa822d3d9408dac2c1548b04 size 25165824 diff --git a/params_shard_32.bin b/params_shard_32.bin index 940cba2b5396c815b2b4388dd0844c1138b40bd0..a87cc7223f1e9fd29a184dc4ef8c6ad2d712c999 100644 --- a/params_shard_32.bin +++ b/params_shard_32.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b08b017c359621513ee7910202aefdbe0d3e5caf7872221f6c9174030a5fccd9 +oid sha256:28324bf9a531de0523cf62069bc12601bba29416be2c59bbbeefae1d465d0624 size 22616064 diff --git a/params_shard_33.bin b/params_shard_33.bin index d806d9c98cc2c7ed9d1d7b466f4601a403f714bf..ae33f1f3c1b7b857be1847e3e83b169a4e423ad9 100644 --- a/params_shard_33.bin +++ b/params_shard_33.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d7405648d486d14f240e1dd4fa89d026a9eed38073463332581cf395326a7fa1 +oid sha256:05db6c2f05b40540e537c4cec4d2d387f97d78a7ff526eb477c828fba1da9073 size 25165824 diff --git a/params_shard_34.bin b/params_shard_34.bin index b27717d5ff697a3b780dca8ccf7eefe28b54d9c9..efe84fd8826b8f6870bfa8321f07c119ed0a90ed 100644 --- a/params_shard_34.bin +++ b/params_shard_34.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:94d8fdb47f5ea2bd00e788923ef1fafee5976c3526455aaf1046901e03b1c50f +oid sha256:cd7101261ba97e7e7e5231826dad79d58c5e3b0559d8dafc8e1cc86a3e4cd249 size 33239040 diff --git a/params_shard_35.bin b/params_shard_35.bin index 4c97bead69630e6c2760f53706d91dc2e08bbc72..00e8659d3142cb07c74135a304800a7d5a7f099c 100644 --- a/params_shard_35.bin +++ b/params_shard_35.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ab8f5a671b4fdfb12659783fc59caffab9a16943dafd880c07712f452a6b3eff +oid sha256:27fc97aa15240e94e85e05f1cdb424d7f914d17fae1e7d76a308e83a412b592c size 49250304 diff --git a/params_shard_36.bin b/params_shard_36.bin index 9da2a16693587a30b74e01edc121461b8c7d2edb..c2b97d99072ddb24e582d4765625f6eaf5686b15 100644 --- a/params_shard_36.bin +++ b/params_shard_36.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f2005fd4875ea10fd5df9a5b9a39d7af7e5cb859664c740db9d25c450825fadb +oid sha256:4537bac1683c57ce5c460ee5c89a22bf45470e2e4c61839b50867445cb16c3ae size 27402240 diff --git a/params_shard_37.bin b/params_shard_37.bin index 8ccaea6daa1dbe1dfede4f38a1dfc8dcc5d1e7cc..cec6dea1e233ed24179139bff1fa42dddeb04038 100644 --- a/params_shard_37.bin +++ b/params_shard_37.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:bd53295cfef825ed58d57a38613c045287c061ebcf7024f2d1935779750f1165 +oid sha256:d2063f087de81d486a84202db6b6c515723557cc59449b181930de10baff2d0b size 25165824 diff --git a/params_shard_38.bin b/params_shard_38.bin index 717e69fa34ac36ff68b4a8488aae3c778b6bc3e0..bebbcb9dc7b1f938a2b11b2de50ea61e30dd7062 100644 --- a/params_shard_38.bin +++ b/params_shard_38.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9b5beae2786a6c1152724680a40f9fac98e53ac59da7d4d7d4cd07459aa1e640 +oid sha256:17b368d41a904c9ac97c6c5f33726f6725ca1964ce9ec39ff50aba62e08175d7 size 22616064 diff --git a/params_shard_39.bin b/params_shard_39.bin index 18b318d1a53a24873f3a37dc8483552c22eec72b..5ec0d72922aa0e3cf4fbf79789374899f8dd37a2 100644 --- a/params_shard_39.bin +++ b/params_shard_39.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7dcade22609700d42c1d15490de203409c39d60e834b319fa9d5bbc917d705ea +oid sha256:aa297df7af5aa2512d729398f574a429bcca6c5c0248ba526443ebccbd6719f9 size 25165824 diff --git a/params_shard_4.bin b/params_shard_4.bin index 3839f6c2da0a38cc883a78936684a5bd5fff8d81..06232b052d385b59ef8be3e9e66fa7450ad6b73b 100644 --- a/params_shard_4.bin +++ b/params_shard_4.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c4fc7a726b65a551b4eaea4703b63617cea761a900b1d7b1f007d20c6de205f2 +oid sha256:6598c58bb43df623984ea9c9c9564cedce5a9039a049ee4d14e730385c99578b size 33239040 diff --git a/params_shard_40.bin b/params_shard_40.bin index fbe5e461e88ed215fd206a0dcf9c796e97ed2fac..13789a6772e2c93e2563b726033e25b0d2230ad3 100644 --- a/params_shard_40.bin +++ b/params_shard_40.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e642fb98a12789b31106a2e8fd01aabcaec3a516ac6cc049050f133e5f813b85 +oid sha256:59f7ba6b7fcd7093fb9393a1d7a3e307d1ec70add8cb2d7858decd0e4789f0a1 size 33239040 diff --git a/params_shard_41.bin b/params_shard_41.bin index 5eedaf5e594dfe86e4b4f3eaa57d25ec34e1ac5d..b738262ee927788da856c80afa59f7023b6d08b3 100644 --- a/params_shard_41.bin +++ b/params_shard_41.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:edc6d7684682df94b5561a5ad38785d2e7c201bc8dd0b10afd212f159abd0c0a +oid sha256:02c449a9ec999c01bae18f98edadf921d869d004817a7e153bf6988ccbc9d7fe size 21239808 diff --git a/params_shard_42.bin b/params_shard_42.bin index e37614e6b109b65bd5b3f474f1d164c0ee341444..a6af2ffa5258189b40e83bddd15f2e379f2482ca 100644 --- a/params_shard_42.bin +++ b/params_shard_42.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5566d064524618b63054b84d1c5b169cec5a0a95480bababce7ed8e820aa1e59 +oid sha256:dfe302cfa588fe7658a15cbb3cd3f942483f102423d39c249b5ecc36283eb74e size 25165824 diff --git a/params_shard_43.bin b/params_shard_43.bin index ff380290abf4706de1cbfbfc2bb61a30c3e9e028..26f9d20da17a843d75c4a284a2a017073b5f35a2 100644 --- a/params_shard_43.bin +++ b/params_shard_43.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:798e26e669cb907437fbfe12c0e4f6b499f982029f8acef3aab1a31b68d3526b +oid sha256:69c724d49f53f789576a9922f6878c981100812bd76c3921bbef181214042041 size 22616064 diff --git a/params_shard_44.bin b/params_shard_44.bin index 9eced55aca6120dae686b1a543f65fcc9b81e0ab..e802814cc2f5ef001c6919b527238791cb230c54 100644 --- a/params_shard_44.bin +++ b/params_shard_44.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:357a9f183b2fa49134d42e62b598811293feccfb67e3e7246969a9b4247d14ec +oid sha256:a6cf37fffe1f9658b913b862d73c15af69c0779681c04e457af355bda9e6a2b3 size 25165824 diff --git a/params_shard_45.bin b/params_shard_45.bin index 39fc3abd2968b0377a8420a86f81917fc9229ac5..e7412d05868c46040b22559b95459538f7bf0bd4 100644 --- a/params_shard_45.bin +++ b/params_shard_45.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:97a50d88d1dd32b74c0c7a4b27b1535a1bbfd62b6a2e5c23399ffdaec71423c1 +oid sha256:12d1beeb01f480fc8dff50a2293675b9a02393fbc96b588d499d2696bbb24ae8 size 33239040 diff --git a/params_shard_46.bin b/params_shard_46.bin index d8dad5bb7bc586f128b47508a7e01d5a4f72a9ce..2067a3c081ee5fa272a764a2cc0b736907eb09ab 100644 --- a/params_shard_46.bin +++ b/params_shard_46.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:788ff75ef31f65fdfe1bad29b83dc5cbd02c51d4aa0da4ef8907916f21951052 +oid sha256:b97b34e2fabc826ffc89e169984579d0def4e5d01fb5194ec722e53ffff39845 size 21239808 diff --git a/params_shard_47.bin b/params_shard_47.bin index f0fd46ce4a737f2a1a09d7573a3b87a704e78c51..9fa0db8aa9d28e557943e55d251122d5fdc70c61 100644 --- a/params_shard_47.bin +++ b/params_shard_47.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4c5ecc000c7cb9b74cc3bce1d93324e6a3ffbf1faac8f45affe567931b4c0321 +oid sha256:f8625d19570c385182a01e20d25d5f656bd647b57c047c1d6f0f0175e260f771 size 25165824 diff --git a/params_shard_48.bin b/params_shard_48.bin index e79e0dab4c669440f6f437da4cb316084ce182de..cafa15d45868ceb62044712fc0f707a7238da2b2 100644 --- a/params_shard_48.bin +++ b/params_shard_48.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:cf9a5975840a6cf6e4d1217935c1269c07559baa7d28db84dbbe99941c1b2cff +oid sha256:8596eb7769b853739b18508ee64bdbbbc59735de5ea556456e8d2ada35e5f1f5 size 22616064 diff --git a/params_shard_49.bin b/params_shard_49.bin index 7c86109a457cef37a45eb32b46a7044669ff6d82..0102f7b1d341495c77e5323c964bedc09f383d08 100644 --- a/params_shard_49.bin +++ b/params_shard_49.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:82435042c029c6c701b1edf2bbe2b08762da1b5e22137fc6353a8f97e028e3fa +oid sha256:913d133aab879f9ec4d18d7b9c0f8eb9de6bee30422f90896f72d712e3268d7c size 25165824 diff --git a/params_shard_5.bin b/params_shard_5.bin index eaab733fd1f4cefea349033636baa2f49ceda6d8..22e45489c7e6fbb8d002ecbaa10e7c697d326790 100644 --- a/params_shard_5.bin +++ b/params_shard_5.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d45a103f2a37247815da2b941128e9315c6bfef266f7af92ac599ff2a89fe64d +oid sha256:c5c505ebe3eaa95444114cb94cd600d8855383f1cf21564aa63c69b58a9ea11a size 21239808 diff --git a/params_shard_50.bin b/params_shard_50.bin index 43ade106777628823a7ab169e5f2d851f8f986b4..b4225b40a10fd9943402e90c74ecfdc22fd3d69d 100644 --- a/params_shard_50.bin +++ b/params_shard_50.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:01ef30751bf30d1f2f80493da65ddccac8470398416dccfa401a2b54643402d2 +oid sha256:74891bad49528f546b29f84a2cb20ee873e3d6219b0e48f361cd04ab85e997ce size 33239040 diff --git a/params_shard_51.bin b/params_shard_51.bin index ad82dda685dcca4b9ad11249497c128e2104692c..142843b7773bf2ee016313566d28d19ee52e2aee 100644 --- a/params_shard_51.bin +++ b/params_shard_51.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1eec3cacd25f5f834c6108f37d9389929a19fabbe1464ad0ad47e76a74d3c534 +oid sha256:758cd02ac7f65e3ae4484198c11638c00ce934702c2f084a1378de13e3faa29b size 21239808 diff --git a/params_shard_52.bin b/params_shard_52.bin index 4a54a6c587c5f99e09e1f2b23d128aa293c8392c..4bce6a39b7ea5e9eda1a82f94d2d3176bfb48565 100644 --- a/params_shard_52.bin +++ b/params_shard_52.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b8456cba6848e7a2937d88b96874f876dab6b7563ad6a16a534eee2ddad837fb +oid sha256:a3fec89919268d2b2b5a5d01b8606a7787386677392f2c12ee9da6840e29d18d size 25165824 diff --git a/params_shard_53.bin b/params_shard_53.bin index 686206034b5b26366eff03b468359a70ec72f6a7..6acd4062e29604bc828edbfefed22689356d1e94 100644 --- a/params_shard_53.bin +++ b/params_shard_53.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c1ecd78c7073452475d13765ac802f78618537f925241b7b459ce5267d1c6ce2 +oid sha256:65de4700bd0604be012481ad1f8fd104dc8c2eb68aea3bbe2180ff1475cdbac1 size 22616064 diff --git a/params_shard_54.bin b/params_shard_54.bin index 06f41819e45c6dd0640a098fd292c51a31d05a70..b52ba0df2f0efaa7f141dfce6127417d48a0bada 100644 --- a/params_shard_54.bin +++ b/params_shard_54.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ddf603abe24538410ec9c441c8552d27c76dcdf492eb699710a0170a9ac7d2ff +oid sha256:f7164ff69ad4e748f4bdc040a0c5bb10949b9e7989d39583713726a050c79d02 size 25165824 diff --git a/params_shard_55.bin b/params_shard_55.bin index 95afd3fea3c822498c9d2b5bce295838b3d4cbed..ea16c399a9b5833d4030efc3df29591224252213 100644 --- a/params_shard_55.bin +++ b/params_shard_55.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:828a79889724295438821dd4a66fa2b2b2f4024f1adcef60b86860aa88a1bf2a +oid sha256:e771068302f62bb9ceaebeb84e0180a724b9011df4684c44b22807bb0ae5c678 size 33239040 diff --git a/params_shard_56.bin b/params_shard_56.bin index de2660a7759e6714f8df60fae0ec6599ce5eada9..9590eaf8ec7bc9285cc29fae1ec5edc6402d550f 100644 --- a/params_shard_56.bin +++ b/params_shard_56.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9e6e4f1b5d0dc57416b12eac8a6e2543d1620645479e75c9be398e234a37f635 +oid sha256:7f834d60176bdb4b692c5f2d3c41b037a4d57e4df4aac845699053a21decdf00 size 21239808 diff --git a/params_shard_57.bin b/params_shard_57.bin index 221a8df35f48f5c2969c3e766bea1ab50563d8d0..7959844b71feab4639fb7c46bc13e30fe6be10c3 100644 --- a/params_shard_57.bin +++ b/params_shard_57.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9537e10e71ca0ce18a9f37e402ea4afb19fe2c287e789d5082db14a595cff0dc +oid sha256:cbb894bba7f749d098b5ef6d187fce0a0a40ee7bf2e88ee494098132abc94b8a size 25165824 diff --git a/params_shard_58.bin b/params_shard_58.bin index e9f32edb1a9cf50bb5350de2317e6a750a58f7f4..b1785277e49debca2f44ede2f7bca24c7e098135 100644 --- a/params_shard_58.bin +++ b/params_shard_58.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a5c64d62853e00bdffa3f2b99cd0a1b55fa630df467baeee8e9e9abe756a06fa +oid sha256:cf1913191314ea4dba5bab1e75d7d0d467c0d9f40c9f04de22e4a698f488aeab size 22616064 diff --git a/params_shard_59.bin b/params_shard_59.bin index c5876f6f0863356e3735b9a502c5264d80937dc4..0fc326b6429603afa00d85e48052ad5fc38c8056 100644 --- a/params_shard_59.bin +++ b/params_shard_59.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:835716d505badee36fd76fe8254f2bc74625be6fd1a38e3f6f0888335bb67e84 +oid sha256:ba985d5c68da37fa7684598afd993c98fc0f9015c5e18aaac946acd1dd2dccff size 25165824 diff --git a/params_shard_6.bin b/params_shard_6.bin index c2f2641c0f68994792d31847cf504f690f697492..7565bf768128cbf207b83d3b0339ec67618d9a68 100644 --- a/params_shard_6.bin +++ b/params_shard_6.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7425be230b27192e9ed2d17fc6a4a71837fbce67e3d6fff088ca72fb69701d25 +oid sha256:d03a744289ff86513d2c739c41bb8d17fb4fa17dc37f906dda1de3bcab230ad0 size 25165824 diff --git a/params_shard_60.bin b/params_shard_60.bin index b3b6c47e15672cb02852be731d7bfd71a0cbf579..3feabd4e3acd697202f818841b41506cfd4c11c2 100644 --- a/params_shard_60.bin +++ b/params_shard_60.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9c1f4c308bba19f8bff5cf1d6e82b63a2808de62c3f1d10b6e2f714de46d16af +oid sha256:89d1222df8e52e2edfc552b82584be255e78e9504dbd38a61468d2e310b0168a size 33239040 diff --git a/params_shard_61.bin b/params_shard_61.bin index 259932617787c275d7be71e85a83bd2e6810a0e6..527c1abed38c304bac220707dfb08f0f77336982 100644 --- a/params_shard_61.bin +++ b/params_shard_61.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:681f0bdb2b063b7ac9fedc7984cdb4750e241bfc4f246bd6284f8d8828e5911b +oid sha256:71bbc16e8e6c1e1b3f997de5d1a4bd0665c8de36816d3c097c371e214a12f605 size 26548224 diff --git a/params_shard_62.bin b/params_shard_62.bin index 24c5a58c00a0176ecb7e522ef99c58d6b98e9727..4a42ffdd347d7892182143569fdca444ba66917d 100644 --- a/params_shard_62.bin +++ b/params_shard_62.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:87a1ac08ca46a2a500790d2fef7e24b9be4451e07b0baf149318d4d46ef96f7c +oid sha256:a0b48f91288269d51ed4a403a373afa288f6776facaa754eec9e0d3ca19517b3 size 25165824 diff --git a/params_shard_63.bin b/params_shard_63.bin index bd7f11048463de2b77861dd078b3107a46c4323e..7e81599b0fff3dbda88106a86a731215ef905d90 100644 --- a/params_shard_63.bin +++ b/params_shard_63.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:aace00cab681cd0e9c82eaab9d3d55413ab193de4911714495c1dc6f7fc7465d +oid sha256:ca51a23de95dcf1a62ea2756b5163b9319c3692e34a937650df34f562c882c20 size 22616064 diff --git a/params_shard_64.bin b/params_shard_64.bin index d1c0e73efa5d661d32ded83ed5a13128782d519e..44fbbe26c8407b656bacee15b7abcb1dc298113c 100644 --- a/params_shard_64.bin +++ b/params_shard_64.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4629d801f43f63e83538478ab707f798958a7c85c310742dffd53782d22fd071 +oid sha256:f079b19907786d8cac2b0aadf747b45c13ca659dfc93ff260413e1c117c43bd8 size 25165824 diff --git a/params_shard_65.bin b/params_shard_65.bin index c6eea96442d3c0092867ca70a7c2f4a402932b7f..5d1503148a8b92e937b20140a7fb8952ba43144d 100644 --- a/params_shard_65.bin +++ b/params_shard_65.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8466d291bf2f92a7d5bd6621012ed6586ece4e75cf37e588363b1e2ebc8a7917 +oid sha256:73f5412853579363917337ad65c8a201e1ffb05b5ed962d6b85a2556d88eb01a size 33239040 diff --git a/params_shard_66.bin b/params_shard_66.bin index 46c9eb4358176b808101bd6bd7ec980fd844691c..4499b98ab5f5eede5cdc1f5357b5a4dea8a0c1d9 100644 --- a/params_shard_66.bin +++ b/params_shard_66.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:00a619830d637770c68aa03a4dcddae4f2b6c6a9cc7ac5722cd9e6a677708c60 +oid sha256:c4b32abe15921cc556b32096e398c3876689752afed0eaddb445c3eac8347f31 size 21239808 diff --git a/params_shard_67.bin b/params_shard_67.bin index c4b55251ce5c9f4e7ad680b030b61c8543582227..7d574fa37e66797b83ed63b7b7732062ef96b4ff 100644 --- a/params_shard_67.bin +++ b/params_shard_67.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:fba42f8f14768e0d2e2eb9511027876868fd806ddd031c6aa380e31774a60a51 +oid sha256:b3864f3a3452fbb183a4ea4449009b4f0110596e290e967257cf40139a6081a2 size 25165824 diff --git a/params_shard_68.bin b/params_shard_68.bin index 440b435374b45c694772f8ca27c380e90d442fb1..7723cc1a29ed05795b9061e495a5b1d00c128b88 100644 --- a/params_shard_68.bin +++ b/params_shard_68.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3f5d43ed9c3675f6ec741a3e95ea6a70c4e86bc08b115d9081a94b63ef7cf2a4 +oid sha256:1ae304e7087a35ade6528c51b26b4a6f85e1eb7b44012e01212c8d36412e1c4b size 22616064 diff --git a/params_shard_69.bin b/params_shard_69.bin index 9b4a5de9dd8a470900587fd40450793f4b23ba4d..689e578f81b09a7a19fac44427d075a745bac838 100644 --- a/params_shard_69.bin +++ b/params_shard_69.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:091dd0894cb175df5eeb56d794814ed1de3824a6d9e50fbf43e8d9684e967924 +oid sha256:a7e0ddb98e460dbd4852d2c0fa51b4a34512a5bcea72d5dc41edc649f29b47bc size 25165824 diff --git a/params_shard_7.bin b/params_shard_7.bin index def01351206fc94308fe0ca7757e47f8bec04c26..aa0088e9ebdbb96ae539ba53e90f358396d8b7ca 100644 --- a/params_shard_7.bin +++ b/params_shard_7.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:384fce109e98b01401984a1d38207447cd054057d28230cca057e15dbf389a16 +oid sha256:505893e3e5d913165b8f98c044a14bd694f21ae88b6b3f41f9f4e5651ee53deb size 22616064 diff --git a/params_shard_70.bin b/params_shard_70.bin index ac21a5fcccac5033e14a5caa18d07e3543ba7a4f..8a1ca085b85aeb3aabf24abe75a7de4d19bfe00e 100644 --- a/params_shard_70.bin +++ b/params_shard_70.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c3e1fc2766c86c09c7f809afec0509c2f3183e1222cb589f8cc77b9cc932b332 +oid sha256:ef3177d6aeb3180d9023c18fecf2816a369dae17fc897cf561abdbf16a816d8f size 33239040 diff --git a/params_shard_71.bin b/params_shard_71.bin index b7a2b8ba11e40d49a24faf63ee0d05b4ed3da897..16388c294e45e674159ee4bfa70bab88d4de22fc 100644 --- a/params_shard_71.bin +++ b/params_shard_71.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b207606e41e26699ccae6ed485950e0d4c175a09e70dc25c6b875fa06e7cbb94 +oid sha256:790999d0965b27ab637c0a0b926d01823aeb03707087801ed7c6f6d97c7c6b06 size 21239808 diff --git a/params_shard_72.bin b/params_shard_72.bin index b88e126400d7d48cb030f658ca170704a44acabe..1947caee54d6b0f60913cddd7c98c6fdcf34c731 100644 --- a/params_shard_72.bin +++ b/params_shard_72.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:041232a9b3819d390b1c767778791d6074d1699117277943b28b66f16a0b3305 +oid sha256:2a639895764f60ddd4f334c11a2eacf311537fb8f99aae6806f44cf43249c82f size 25165824 diff --git a/params_shard_73.bin b/params_shard_73.bin index ea5c2c302c6724368a2d7afb4dc2a9d630e2f658..e07f93c9d41764c70263e6ddbaf9d1e9cf315f72 100644 --- a/params_shard_73.bin +++ b/params_shard_73.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2d89a9ee79c188f473ab6b355a84ce1c99131686872513e9901b58fdd284d7e4 +oid sha256:153bda9a2a205922e330beb7017cb427731c0e37e4b154d98ade0984895439ec size 22616064 diff --git a/params_shard_74.bin b/params_shard_74.bin index e6c8835a724bbdfbe5f8896272bf1d4e54c764d3..c259b00a221f8eb075bf1c61c01d40212a2e3113 100644 --- a/params_shard_74.bin +++ b/params_shard_74.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:aff5363ab20de93229218bb56548eaaed3910f1e809c21d853d3ed214d1d5df0 +oid sha256:52f53d5c2cf9149c00e74e59f2085e7816b4626b3efa684dd8a3f4c70ea54c4d size 25165824 diff --git a/params_shard_75.bin b/params_shard_75.bin index 223c2df6474e731bc134100f7d5706c6c6ef453f..5025e0752fa7434fe4591e4586a8c8441af1c9cc 100644 --- a/params_shard_75.bin +++ b/params_shard_75.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f8294b3c0eb0e4b178c5b7fa294c2434f336c29ae24c369ce6fd77b3070f4f77 +oid sha256:d6ba29aab4292ae7a29cdf18bf0989993cbcda58b01133354c5f32b7452f42c6 size 33239040 diff --git a/params_shard_76.bin b/params_shard_76.bin index 8a79131982d31eb4508e4b51ca5247fe94e12dcf..cc403ae8751bfe136ace8649e2199a0a9fff7928 100644 --- a/params_shard_76.bin +++ b/params_shard_76.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0277d1608d39282ab2d3823e7ff86796b2a562d4b026b96410090e1526c8293a +oid sha256:b3c37af494b0c1e01867100f2d8c7c5122ad010ef62565c9872586fea1fb1b32 size 21239808 diff --git a/params_shard_77.bin b/params_shard_77.bin index 8c94101968f8ac306b0fdce485a2384e3b2554f0..34e1fab637631cee9abeac155470dc4e9eec977d 100644 --- a/params_shard_77.bin +++ b/params_shard_77.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1ab5bc05811a46011793880ad29a2f06b726c49283746ceaf0e3fc60118b1200 +oid sha256:5fbe539e34af2e25c45e7034de4f0d255fcb73ede4912b8b4b4e1107e3f006ce size 25165824 diff --git a/params_shard_78.bin b/params_shard_78.bin index 294a1165e1808a6eec5c0794a5ed3c5a96196daf..2f31f4b8a763753ce663a8027fc1dbb8f5d951fc 100644 --- a/params_shard_78.bin +++ b/params_shard_78.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1aac0fd996b19a1784d4b855fdec6684b730307ced70093c1c66f4efc1eb3e38 +oid sha256:0d9243124b5e5e67319ca5a84b3d43a58ed25aa6a4b520c03384868cf0bae306 size 22616064 diff --git a/params_shard_79.bin b/params_shard_79.bin index fb0e06f58cf568c5d87a2fef279f3235f942d1ad..52841105927507925b8829648330a2418fd748d1 100644 --- a/params_shard_79.bin +++ b/params_shard_79.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:dc2543785e8444975ed6127428fc2cc00cfc5e4da7e8c04dc93d9d311adee9ea +oid sha256:773adde5996a8672767f99b90edc48ee4cdffbbea45290ed9d7c5e7289109ee7 size 25165824 diff --git a/params_shard_8.bin b/params_shard_8.bin index 95d3c821851d33b12ed01d424b2d4d6136420564..8a81d1749f17c039dae17d4f67b22c732695aeea 100644 --- a/params_shard_8.bin +++ b/params_shard_8.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ab9ffb27c18e769343a93f175da71a205bb583402ab9fa00a23ac132abfc1830 +oid sha256:d13db7d0c891683730db5fe3cc80acdb16c9042a01c4a5a9b988b40571e79057 size 25165824 diff --git a/params_shard_80.bin b/params_shard_80.bin index de5aaf752d024cf33103f8de4f0ad719b42ee183..89c6583e053bdb429e28d9f7e00e2d02fa33f73c 100644 --- a/params_shard_80.bin +++ b/params_shard_80.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e9c74f482fc1cbaa9341f37ee775843194ea10a1c408e3a2328f909759326e1a +oid sha256:55d29a96097f876d3a80b59506f6ef246d1827b419f03b20df4ca9f115604cbb size 33239040 diff --git a/params_shard_81.bin b/params_shard_81.bin index 3df1fbc5527cda9d5b98ef12515e406b45cb45cd..58d167e1e46a3cd832c5b0ee2b5d37c298d58790 100644 --- a/params_shard_81.bin +++ b/params_shard_81.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:74e5f281da70393d3399f55c0e66a512af77c0239f1a8f1b353b5e4ece4cc986 -size 32262720 +oid sha256:ed6fd161ef316e97f12b0198574443d39911cede7fc4bfe9f0bd25d3d1ee1e55 +size 32036864 diff --git a/params_shard_82.bin b/params_shard_82.bin index 0957649043a8da22abc6eb86410b54c5bfd6aa14..59811b282fc7444ac981a47824ad41bce4939b94 100644 --- a/params_shard_82.bin +++ b/params_shard_82.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ffd52ccaaac0201765132ed9a2a1d646fc1b77f4fa08c657f270b168000c6589 -size 33161216 +oid sha256:95f92d7517fff429ac6464ed3de54b841aafd2e1b96485d8edbcd6f0f5c9892c +size 25192448 diff --git a/params_shard_83.bin b/params_shard_83.bin index 6684169e92bfec9faab92b7541992a00cf6797e3..d4459fd39922dec7c841f7b8c4fc14cf554e6364 100644 --- a/params_shard_83.bin +++ b/params_shard_83.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:62b26d1c9f00ab5ae9a6d897e4630017dddc0672d8ef7c52617e4eda04d06dac -size 33140736 +oid sha256:2907f5074bdae488baf0179fbd0d3a9703b8925d6aa26c19072cf39f30632a52 +size 25192448 diff --git a/params_shard_84.bin b/params_shard_84.bin index 689c2a66c22764da73bb8c9423e07ded168e2f06..3a09bfb8ad77f262966a65a055c39cb93804bd4c 100644 --- a/params_shard_84.bin +++ b/params_shard_84.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d0e4fcafb3bc91e90db4cd991e3317c3c31727daf12b0c80c34e5e654ff5c7f5 -size 33161216 +oid sha256:e52258f6054bfd1e5a63f3009d47471e6997e28b096182a3be103002625e7b5f +size 25192448 diff --git a/params_shard_85.bin b/params_shard_85.bin index 31b30c54c1bce21250301881d1ab1dd0090b7f2e..99688b0c0db89f44b28bff638c846f0db53e719c 100644 --- a/params_shard_85.bin +++ b/params_shard_85.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c408c01882691a01462a07db75e166c5bb40d55856b747964bcc48d6ea4970e8 -size 33161216 +oid sha256:dd9acd6c014a0e3e3a897009cb53798fc88b404b1716927528c983fb1c209506 +size 25192448 diff --git a/params_shard_86.bin b/params_shard_86.bin index 314e102d52384564e191bf7cd04d244486b64e3f..8feb427823459689c69aa930cab2a23292327a4a 100644 --- a/params_shard_86.bin +++ b/params_shard_86.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:19fa26bb363e8e76010f4c80cf255fe33a8657db36a0f20046331095f562f4c3 -size 28416000 +oid sha256:b98c509c9dd6d2d651ce561a1b40b9ed54da611a1dee3b301939ce644f8ab5f4 +size 25192448 diff --git a/params_shard_87.bin b/params_shard_87.bin index b5c265765255a28ad38396c1ffb5959781d489e0..5d23a29ba623e1bd9cf07a33ec4fc4187cf240f7 100644 --- a/params_shard_87.bin +++ b/params_shard_87.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e670059e7b1805d8a9b13bf76a499d7f1bcc6639b36f64b9761f3a8a952a5970 -size 12400640 +oid sha256:a393ae05270bacd4e1bfc159c658dc0c2d120c62b74814ce0dcb4e1dc6adbb25 +size 25192448 diff --git a/params_shard_88.bin b/params_shard_88.bin new file mode 100644 index 0000000000000000000000000000000000000000..72f9664df124f76c21c700903e633730d1f752a2 --- /dev/null +++ b/params_shard_88.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:961c95cae2217b3f91ae66dd5bdd217a3786570e08e92526a0ed1e31a9d0a26d +size 25192448 diff --git a/params_shard_89.bin b/params_shard_89.bin new file mode 100644 index 0000000000000000000000000000000000000000..98c06b0966c3bdb1b9fdb1479b91754bae3ca839 --- /dev/null +++ b/params_shard_89.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efa58db84fbc3b6cac71f8d43b11ebc7ea23514a9759fb642c4424107ebe52ef +size 25192448 diff --git a/params_shard_9.bin b/params_shard_9.bin index 2f6c59788df92e8dd55d2f9a899d5d3a64cbdde8..c2dd32b9b74ceecfccf4514e57714d9794f92c8c 100644 --- a/params_shard_9.bin +++ b/params_shard_9.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:39843375e2e47925a10b9ae7224822b4e9ab533f66bcf095a6006ce7736b92c1 +oid sha256:9bd8cb9d9ddd99f4aa3ce471e3eb5e5cc0e2838ff3fd262c47369b06f0f45998 size 33239040 diff --git a/params_shard_90.bin b/params_shard_90.bin new file mode 100644 index 0000000000000000000000000000000000000000..d5f3a209d8fea02e4e3b71d5d4a8753800f04b4c --- /dev/null +++ b/params_shard_90.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe8b445092c0315182349dcad54cf7152c561d2238ae565e740576c766da99b0 +size 25192448 diff --git a/params_shard_91.bin b/params_shard_91.bin new file mode 100644 index 0000000000000000000000000000000000000000..4351b9bab50d16bc35d02d66f1a957cc48a9b0bb --- /dev/null +++ b/params_shard_91.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44419c11afdfe4a06d2fafba5568f054aa4d01d580291b9d5978c36951fa14b7 +size 25192448 diff --git a/params_shard_92.bin b/params_shard_92.bin new file mode 100644 index 0000000000000000000000000000000000000000..cd692928a5e2b04d81dae5f4ce877fe46b39bf12 --- /dev/null +++ b/params_shard_92.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fe50070e333c5844a40ba3a6961a2164c2a15fa53e554848d4f0c7d1819c819 +size 25192448 diff --git a/params_shard_93.bin b/params_shard_93.bin new file mode 100644 index 0000000000000000000000000000000000000000..15df2cd29ab48348b42c74fa11c4ae4e546938a7 --- /dev/null +++ b/params_shard_93.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c8111bddd12144adfa3a8dee1a21d2c9134f5f94179aefac6d3d6d5a08eb623 +size 25192448 diff --git a/params_shard_94.bin b/params_shard_94.bin new file mode 100644 index 0000000000000000000000000000000000000000..767cc22ad290c9e6ef407055a0957afed85a139f --- /dev/null +++ b/params_shard_94.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef3a20952446e3802dcd8392cf071e9d5427d1287901517af125a7bcb6d68722 +size 25192448 diff --git a/params_shard_95.bin b/params_shard_95.bin new file mode 100644 index 0000000000000000000000000000000000000000..c499622903ea5bca9e07a1cd29211976deac6361 --- /dev/null +++ b/params_shard_95.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c10de3efd24198d9211e04c07fa0589647f24ec9c2b23eb79c05b1c03913e77c +size 25192448 diff --git a/params_shard_96.bin b/params_shard_96.bin new file mode 100644 index 0000000000000000000000000000000000000000..27702db0ef554ab6dc3b1cfd50382fdf89a86644 --- /dev/null +++ b/params_shard_96.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25823a9063b8218a1d3d11d18be96984a5f798e8efc1ac26b97083dd369c308a +size 25192448 diff --git a/params_shard_97.bin b/params_shard_97.bin new file mode 100644 index 0000000000000000000000000000000000000000..efe41e5de5cadef2fd1f04e22ecb210a5ab0caac --- /dev/null +++ b/params_shard_97.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f917a43ac21c3f03b0dfb3c3ca797dc6e95da24d37659e88d823aa4cd948ed5e +size 25192448 diff --git a/params_shard_98.bin b/params_shard_98.bin new file mode 100644 index 0000000000000000000000000000000000000000..4d0108c8f2d520525574269cee045e3f3c9e1de8 --- /dev/null +++ b/params_shard_98.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dd89aa87467417fba324dbc57251fb8af684b86da3dd5ff95fab8eedf31325f +size 25192448 diff --git a/params_shard_99.bin b/params_shard_99.bin new file mode 100644 index 0000000000000000000000000000000000000000..b61a1190637f49ce4ffeedbe07da73ba69efb144 --- /dev/null +++ b/params_shard_99.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e7957183ff6d4b77bba3b349158d2d0d3c5c0059140f0e6dc3836ab2b28fd1d +size 25192448