diff --git "a/ndarray-cache.json" "b/ndarray-cache.json" new file mode 100644--- /dev/null +++ "b/ndarray-cache.json" @@ -0,0 +1,4459 @@ +{ + "metadata": { + "ParamSize": 327 + }, + "records": [ + { + "dataPath": "params_shard_0.bin", + "format": "raw-shard", + "nbytes": 65536000, + "records": [ + { + "name": "param_0", + "shape": [ + 32000, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 65536000, + "byteOffset": 0 + } + ], + "md5sum": "ece1151341dccecec890647e0adf406d" + }, + { + "dataPath": "params_shard_1.bin", + "format": "raw-shard", + "nbytes": 33357824, + "records": [ + { + "name": "param_1", + "shape": [ + 32000, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192000, + "byteOffset": 0 + }, + { + "name": "param_2", + "shape": [ + 12288, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 8192000 + } + ], + "md5sum": "bd8981d692e125b5a00e4b6a7cae2422" + }, + { + "dataPath": "params_shard_2.bin", + "format": "raw-shard", + "nbytes": 45088768, + "records": [ + { + "name": "param_6", + "shape": [ + 22016, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 45088768, + "byteOffset": 0 + } + ], + "md5sum": "a3fa50c3497a1b9ea9039db6cac1c7ae" + }, + { + "dataPath": "params_shard_3.bin", + "format": "raw-shard", + "nbytes": 22544384, + "records": [ + { + "name": "param_8", + "shape": [ + 4096, + 1376 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 22544384, + "byteOffset": 0 + } + ], + "md5sum": "69a025e2b1db365ac6233b53cdbebde5" + }, + { + "dataPath": "params_shard_4.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_12", + "shape": [ + 12288, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "ceea8924283a459e4a22546e7f88e7a4" + }, + { + "dataPath": "params_shard_5.bin", + "format": "raw-shard", + "nbytes": 32587776, + "records": [ + { + "name": "param_3", + "shape": [ + 12288, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 0 + }, + { + "name": "param_4", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 3145728 + }, + { + "name": "param_5", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 11534336 + }, + { + "name": "param_7", + "shape": [ + 22016, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5636096, + "byteOffset": 12582912 + }, + { + "name": "param_9", + "shape": [ + 4096, + 344 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2818048, + "byteOffset": 18219008 + }, + { + "name": "param_10", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 21037056 + }, + { + "name": "param_11", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 21045248 + }, + { + "name": "param_13", + "shape": [ + 12288, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 21053440 + }, + { + "name": "param_14", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 24199168 + } + ], + "md5sum": "899012c14105657124da323ae9b7edbc" + }, + { + "dataPath": "params_shard_6.bin", + "format": "raw-shard", + "nbytes": 45088768, + "records": [ + { + "name": "param_16", + "shape": [ + 22016, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 45088768, + "byteOffset": 0 + } + ], + "md5sum": "e9d940ba64169c4a20099245d2b741a1" + }, + { + "dataPath": "params_shard_7.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_22", + "shape": [ + 12288, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "a8f2de76adde641c3eeff214526c4c25" + }, + { + "dataPath": "params_shard_8.bin", + "format": "raw-shard", + "nbytes": 32063488, + "records": [ + { + "name": "param_15", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 0 + }, + { + "name": "param_17", + "shape": [ + 22016, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5636096, + "byteOffset": 1048576 + }, + { + "name": "param_18", + "shape": [ + 4096, + 1376 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 22544384, + "byteOffset": 6684672 + }, + { + "name": "param_19", + "shape": [ + 4096, + 344 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2818048, + "byteOffset": 29229056 + }, + { + "name": "param_20", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 32047104 + }, + { + "name": "param_21", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 32055296 + } + ], + "md5sum": "5b4b11a003a98d2898fb8d80a325e330" + }, + { + "dataPath": "params_shard_9.bin", + "format": "raw-shard", + "nbytes": 45088768, + "records": [ + { + "name": "param_26", + "shape": [ + 22016, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 45088768, + "byteOffset": 0 + } + ], + "md5sum": "bdafe526a555a519a270c7f76ff4e277" + }, + { + "dataPath": "params_shard_10.bin", + "format": "raw-shard", + "nbytes": 22544384, + "records": [ + { + "name": "param_28", + "shape": [ + 4096, + 1376 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 22544384, + "byteOffset": 0 + } + ], + "md5sum": "d6bc92252d2362030d269d231f14fd21" + }, + { + "dataPath": "params_shard_11.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_32", + "shape": [ + 12288, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "5fc906b03fd15ff4d40225458dfcc3f2" + }, + { + "dataPath": "params_shard_12.bin", + "format": "raw-shard", + "nbytes": 32587776, + "records": [ + { + "name": "param_23", + "shape": [ + 12288, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 0 + }, + { + "name": "param_24", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 3145728 + }, + { + "name": "param_25", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 11534336 + }, + { + "name": "param_27", + "shape": [ + 22016, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5636096, + "byteOffset": 12582912 + }, + { + "name": "param_29", + "shape": [ + 4096, + 344 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2818048, + "byteOffset": 18219008 + }, + { + "name": "param_30", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 21037056 + }, + { + "name": "param_31", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 21045248 + }, + { + "name": "param_33", + "shape": [ + 12288, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 21053440 + }, + { + "name": "param_34", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 24199168 + } + ], + "md5sum": "67e1d17d317d5f56c3bacaff34015f00" + }, + { + "dataPath": "params_shard_13.bin", + "format": "raw-shard", + "nbytes": 45088768, + "records": [ + { + "name": "param_36", + "shape": [ + 22016, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 45088768, + "byteOffset": 0 + } + ], + "md5sum": "3e1f9b33a39cca907af516bc89af1ab7" + }, + { + "dataPath": "params_shard_14.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_42", + "shape": [ + 12288, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "c0a6b986b5a0da7fa8ce08f85707b187" + }, + { + "dataPath": "params_shard_15.bin", + "format": "raw-shard", + "nbytes": 32063488, + "records": [ + { + "name": "param_35", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 0 + }, + { + "name": "param_37", + "shape": [ + 22016, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5636096, + "byteOffset": 1048576 + }, + { + "name": "param_38", + "shape": [ + 4096, + 1376 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 22544384, + "byteOffset": 6684672 + }, + { + "name": "param_39", + "shape": [ + 4096, + 344 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2818048, + "byteOffset": 29229056 + }, + { + "name": "param_40", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 32047104 + }, + { + "name": "param_41", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 32055296 + } + ], + "md5sum": "da92f1d99a11636a7e5914d1f2921d25" + }, + { + "dataPath": "params_shard_16.bin", + "format": "raw-shard", + "nbytes": 45088768, + "records": [ + { + "name": "param_46", + "shape": [ + 22016, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 45088768, + "byteOffset": 0 + } + ], + "md5sum": "eb27bd909a324cde3837bea5dc80fb76" + }, + { + "dataPath": "params_shard_17.bin", + "format": "raw-shard", + "nbytes": 22544384, + "records": [ + { + "name": "param_48", + "shape": [ + 4096, + 1376 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 22544384, + "byteOffset": 0 + } + ], + "md5sum": "b5ffe359ed1d7e811ae2f8b566eb92d5" + }, + { + "dataPath": "params_shard_18.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_52", + "shape": [ + 12288, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "322386c573f8080bc520fed1cb2c956b" + }, + { + "dataPath": "params_shard_19.bin", + "format": "raw-shard", + "nbytes": 32587776, + "records": [ + { + "name": "param_43", + "shape": [ + 12288, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 0 + }, + { + "name": "param_44", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 3145728 + }, + { + "name": "param_45", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 11534336 + }, + { + "name": "param_47", + "shape": [ + 22016, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5636096, + "byteOffset": 12582912 + }, + { + "name": "param_49", + "shape": [ + 4096, + 344 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2818048, + "byteOffset": 18219008 + }, + { + "name": "param_50", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 21037056 + }, + { + "name": "param_51", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 21045248 + }, + { + "name": "param_53", + "shape": [ + 12288, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 21053440 + }, + { + "name": "param_54", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 24199168 + } + ], + "md5sum": "624a019590e9a498b5d18e05d83894b8" + }, + { + "dataPath": "params_shard_20.bin", + "format": "raw-shard", + "nbytes": 45088768, + "records": [ + { + "name": "param_56", + "shape": [ + 22016, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 45088768, + "byteOffset": 0 + } + ], + "md5sum": "e6d8b8c5b7877c841a2ea536945d97ba" + }, + { + "dataPath": "params_shard_21.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_62", + "shape": [ + 12288, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "a3c402dbec2d1dafabbbfa5c1eddfb1f" + }, + { + "dataPath": "params_shard_22.bin", + "format": "raw-shard", + "nbytes": 32063488, + "records": [ + { + "name": "param_55", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 0 + }, + { + "name": "param_57", + "shape": [ + 22016, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5636096, + "byteOffset": 1048576 + }, + { + "name": "param_58", + "shape": [ + 4096, + 1376 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 22544384, + "byteOffset": 6684672 + }, + { + "name": "param_59", + "shape": [ + 4096, + 344 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2818048, + "byteOffset": 29229056 + }, + { + "name": "param_60", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 32047104 + }, + { + "name": "param_61", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 32055296 + } + ], + "md5sum": "bb276eb47a9a93c5cc58566095ad4548" + }, + { + "dataPath": "params_shard_23.bin", + "format": "raw-shard", + "nbytes": 45088768, + "records": [ + { + "name": "param_66", + "shape": [ + 22016, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 45088768, + "byteOffset": 0 + } + ], + "md5sum": "15cba2764788f351de81ac5f9dad193e" + }, + { + "dataPath": "params_shard_24.bin", + "format": "raw-shard", + "nbytes": 22544384, + "records": [ + { + "name": "param_68", + "shape": [ + 4096, + 1376 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 22544384, + "byteOffset": 0 + } + ], + "md5sum": "00183c92850e786ea2b912a0954e9294" + }, + { + "dataPath": "params_shard_25.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_72", + "shape": [ + 12288, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "edff072b648d0d47232a21de0edc553c" + }, + { + "dataPath": "params_shard_26.bin", + "format": "raw-shard", + "nbytes": 32587776, + "records": [ + { + "name": "param_63", + "shape": [ + 12288, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 0 + }, + { + "name": "param_64", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 3145728 + }, + { + "name": "param_65", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 11534336 + }, + { + "name": "param_67", + "shape": [ + 22016, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5636096, + "byteOffset": 12582912 + }, + { + "name": "param_69", + "shape": [ + 4096, + 344 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2818048, + "byteOffset": 18219008 + }, + { + "name": "param_70", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 21037056 + }, + { + "name": "param_71", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 21045248 + }, + { + "name": "param_73", + "shape": [ + 12288, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 21053440 + }, + { + "name": "param_74", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 24199168 + } + ], + "md5sum": "77617f8a8b22489cde8315214ebf21fd" + }, + { + "dataPath": "params_shard_27.bin", + "format": "raw-shard", + "nbytes": 45088768, + "records": [ + { + "name": "param_76", + "shape": [ + 22016, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 45088768, + "byteOffset": 0 + } + ], + "md5sum": "58b429e41047d0f6c130d89bc84b598f" + }, + { + "dataPath": "params_shard_28.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_82", + "shape": [ + 12288, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "3462f9f326b0644d91a33bb5b5611c23" + }, + { + "dataPath": "params_shard_29.bin", + "format": "raw-shard", + "nbytes": 32063488, + "records": [ + { + "name": "param_75", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 0 + }, + { + "name": "param_77", + "shape": [ + 22016, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5636096, + "byteOffset": 1048576 + }, + { + "name": "param_78", + "shape": [ + 4096, + 1376 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 22544384, + "byteOffset": 6684672 + }, + { + "name": "param_79", + "shape": [ + 4096, + 344 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2818048, + "byteOffset": 29229056 + }, + { + "name": "param_80", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 32047104 + }, + { + "name": "param_81", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 32055296 + } + ], + "md5sum": "446f1c1ca373370b9a28d9a465f54dba" + }, + { + "dataPath": "params_shard_30.bin", + "format": "raw-shard", + "nbytes": 45088768, + "records": [ + { + "name": "param_86", + "shape": [ + 22016, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 45088768, + "byteOffset": 0 + } + ], + "md5sum": "b0a289775b0c123271c7b315252af49d" + }, + { + "dataPath": "params_shard_31.bin", + "format": "raw-shard", + "nbytes": 22544384, + "records": [ + { + "name": "param_88", + "shape": [ + 4096, + 1376 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 22544384, + "byteOffset": 0 + } + ], + "md5sum": "db0443c26f7d7d20ff259f8b36efb867" + }, + { + "dataPath": "params_shard_32.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_92", + "shape": [ + 12288, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "8f57c7ab7ca22dc43a4dc9a06b53be06" + }, + { + "dataPath": "params_shard_33.bin", + "format": "raw-shard", + "nbytes": 32587776, + "records": [ + { + "name": "param_83", + "shape": [ + 12288, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 0 + }, + { + "name": "param_84", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 3145728 + }, + { + "name": "param_85", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 11534336 + }, + { + "name": "param_87", + "shape": [ + 22016, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5636096, + "byteOffset": 12582912 + }, + { + "name": "param_89", + "shape": [ + 4096, + 344 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2818048, + "byteOffset": 18219008 + }, + { + "name": "param_90", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 21037056 + }, + { + "name": "param_91", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 21045248 + }, + { + "name": "param_93", + "shape": [ + 12288, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 21053440 + }, + { + "name": "param_94", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 24199168 + } + ], + "md5sum": "ac20bb60e2149a55d86b20a6928f89f0" + }, + { + "dataPath": "params_shard_34.bin", + "format": "raw-shard", + "nbytes": 45088768, + "records": [ + { + "name": "param_96", + "shape": [ + 22016, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 45088768, + "byteOffset": 0 + } + ], + "md5sum": "ed4a874599224759db86cbf0bb8c4e5f" + }, + { + "dataPath": "params_shard_35.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_102", + "shape": [ + 12288, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "d6e7e2e7ecb6bebeefa8eecf70947222" + }, + { + "dataPath": "params_shard_36.bin", + "format": "raw-shard", + "nbytes": 32063488, + "records": [ + { + "name": "param_95", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 0 + }, + { + "name": "param_97", + "shape": [ + 22016, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5636096, + "byteOffset": 1048576 + }, + { + "name": "param_98", + "shape": [ + 4096, + 1376 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 22544384, + "byteOffset": 6684672 + }, + { + "name": "param_99", + "shape": [ + 4096, + 344 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2818048, + "byteOffset": 29229056 + }, + { + "name": "param_100", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 32047104 + }, + { + "name": "param_101", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 32055296 + } + ], + "md5sum": "fdd6208edbd7738fe69380968a296bf1" + }, + { + "dataPath": "params_shard_37.bin", + "format": "raw-shard", + "nbytes": 45088768, + "records": [ + { + "name": "param_106", + "shape": [ + 22016, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 45088768, + "byteOffset": 0 + } + ], + "md5sum": "bfd1c59d8b8762eb71bdcbf38e15d28a" + }, + { + "dataPath": "params_shard_38.bin", + "format": "raw-shard", + "nbytes": 22544384, + "records": [ + { + "name": "param_108", + "shape": [ + 4096, + 1376 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 22544384, + "byteOffset": 0 + } + ], + "md5sum": "448fe0a3e126ad96d74016aff08e0e43" + }, + { + "dataPath": "params_shard_39.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_112", + "shape": [ + 12288, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "2ae1ba41ae5aa869afb9b57890e37184" + }, + { + "dataPath": "params_shard_40.bin", + "format": "raw-shard", + "nbytes": 32587776, + "records": [ + { + "name": "param_103", + "shape": [ + 12288, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 0 + }, + { + "name": "param_104", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 3145728 + }, + { + "name": "param_105", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 11534336 + }, + { + "name": "param_107", + "shape": [ + 22016, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5636096, + "byteOffset": 12582912 + }, + { + "name": "param_109", + "shape": [ + 4096, + 344 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2818048, + "byteOffset": 18219008 + }, + { + "name": "param_110", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 21037056 + }, + { + "name": "param_111", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 21045248 + }, + { + "name": "param_113", + "shape": [ + 12288, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 21053440 + }, + { + "name": "param_114", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 24199168 + } + ], + "md5sum": "a12e88681a4e10f3e62db1e98a8d7ea5" + }, + { + "dataPath": "params_shard_41.bin", + "format": "raw-shard", + "nbytes": 45088768, + "records": [ + { + "name": "param_116", + "shape": [ + 22016, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 45088768, + "byteOffset": 0 + } + ], + "md5sum": "f1895f944ad87e9728b25abb2f6c94e8" + }, + { + "dataPath": "params_shard_42.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_122", + "shape": [ + 12288, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "84a3f41aca432dd5651e43ec5aa6d6a2" + }, + { + "dataPath": "params_shard_43.bin", + "format": "raw-shard", + "nbytes": 32063488, + "records": [ + { + "name": "param_115", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 0 + }, + { + "name": "param_117", + "shape": [ + 22016, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5636096, + "byteOffset": 1048576 + }, + { + "name": "param_118", + "shape": [ + 4096, + 1376 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 22544384, + "byteOffset": 6684672 + }, + { + "name": "param_119", + "shape": [ + 4096, + 344 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2818048, + "byteOffset": 29229056 + }, + { + "name": "param_120", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 32047104 + }, + { + "name": "param_121", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 32055296 + } + ], + "md5sum": "06bd8db0ce1dcea1c0cf75242735752f" + }, + { + "dataPath": "params_shard_44.bin", + "format": "raw-shard", + "nbytes": 45088768, + "records": [ + { + "name": "param_126", + "shape": [ + 22016, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 45088768, + "byteOffset": 0 + } + ], + "md5sum": "a2ced1ae74c15bddf7662d2483dc831c" + }, + { + "dataPath": "params_shard_45.bin", + "format": "raw-shard", + "nbytes": 22544384, + "records": [ + { + "name": "param_128", + "shape": [ + 4096, + 1376 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 22544384, + "byteOffset": 0 + } + ], + "md5sum": "1de06d78759029f201a0a13e66b03114" + }, + { + "dataPath": "params_shard_46.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_132", + "shape": [ + 12288, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "3ee0c67c18503b112119afa9655f6ce9" + }, + { + "dataPath": "params_shard_47.bin", + "format": "raw-shard", + "nbytes": 32587776, + "records": [ + { + "name": "param_123", + "shape": [ + 12288, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 0 + }, + { + "name": "param_124", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 3145728 + }, + { + "name": "param_125", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 11534336 + }, + { + "name": "param_127", + "shape": [ + 22016, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5636096, + "byteOffset": 12582912 + }, + { + "name": "param_129", + "shape": [ + 4096, + 344 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2818048, + "byteOffset": 18219008 + }, + { + "name": "param_130", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 21037056 + }, + { + "name": "param_131", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 21045248 + }, + { + "name": "param_133", + "shape": [ + 12288, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 21053440 + }, + { + "name": "param_134", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 24199168 + } + ], + "md5sum": "80104f4150c89920e0a410acb83711f8" + }, + { + "dataPath": "params_shard_48.bin", + "format": "raw-shard", + "nbytes": 45088768, + "records": [ + { + "name": "param_136", + "shape": [ + 22016, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 45088768, + "byteOffset": 0 + } + ], + "md5sum": "7b6ca0cb272a374603ece2b2c65d5b6c" + }, + { + "dataPath": "params_shard_49.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_142", + "shape": [ + 12288, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "19926c97cb3ccb3fe8e17b6a881d3d60" + }, + { + "dataPath": "params_shard_50.bin", + "format": "raw-shard", + "nbytes": 32063488, + "records": [ + { + "name": "param_135", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 0 + }, + { + "name": "param_137", + "shape": [ + 22016, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5636096, + "byteOffset": 1048576 + }, + { + "name": "param_138", + "shape": [ + 4096, + 1376 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 22544384, + "byteOffset": 6684672 + }, + { + "name": "param_139", + "shape": [ + 4096, + 344 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2818048, + "byteOffset": 29229056 + }, + { + "name": "param_140", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 32047104 + }, + { + "name": "param_141", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 32055296 + } + ], + "md5sum": "dfeff31b6d980ba07ff311228dccdb0e" + }, + { + "dataPath": "params_shard_51.bin", + "format": "raw-shard", + "nbytes": 45088768, + "records": [ + { + "name": "param_146", + "shape": [ + 22016, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 45088768, + "byteOffset": 0 + } + ], + "md5sum": "9413d2845653d88ca869554d6dd4515d" + }, + { + "dataPath": "params_shard_52.bin", + "format": "raw-shard", + "nbytes": 22544384, + "records": [ + { + "name": "param_148", + "shape": [ + 4096, + 1376 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 22544384, + "byteOffset": 0 + } + ], + "md5sum": "33d6b1f58a5665d7e3242aff9db47514" + }, + { + "dataPath": "params_shard_53.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_152", + "shape": [ + 12288, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "025617bf137bf1f744f638a69ef5eb84" + }, + { + "dataPath": "params_shard_54.bin", + "format": "raw-shard", + "nbytes": 32587776, + "records": [ + { + "name": "param_143", + "shape": [ + 12288, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 0 + }, + { + "name": "param_144", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 3145728 + }, + { + "name": "param_145", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 11534336 + }, + { + "name": "param_147", + "shape": [ + 22016, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5636096, + "byteOffset": 12582912 + }, + { + "name": "param_149", + "shape": [ + 4096, + 344 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2818048, + "byteOffset": 18219008 + }, + { + "name": "param_150", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 21037056 + }, + { + "name": "param_151", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 21045248 + }, + { + "name": "param_153", + "shape": [ + 12288, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 21053440 + }, + { + "name": "param_154", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 24199168 + } + ], + "md5sum": "2c657a08d9e66ebfdbca0dea52710b28" + }, + { + "dataPath": "params_shard_55.bin", + "format": "raw-shard", + "nbytes": 45088768, + "records": [ + { + "name": "param_156", + "shape": [ + 22016, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 45088768, + "byteOffset": 0 + } + ], + "md5sum": "7914d46ab1a0be1d954a1f9a812330b5" + }, + { + "dataPath": "params_shard_56.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_162", + "shape": [ + 12288, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "2998c328d4dfd0d010d97909ac2dc177" + }, + { + "dataPath": "params_shard_57.bin", + "format": "raw-shard", + "nbytes": 32063488, + "records": [ + { + "name": "param_155", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 0 + }, + { + "name": "param_157", + "shape": [ + 22016, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5636096, + "byteOffset": 1048576 + }, + { + "name": "param_158", + "shape": [ + 4096, + 1376 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 22544384, + "byteOffset": 6684672 + }, + { + "name": "param_159", + "shape": [ + 4096, + 344 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2818048, + "byteOffset": 29229056 + }, + { + "name": "param_160", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 32047104 + }, + { + "name": "param_161", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 32055296 + } + ], + "md5sum": "4791216ff3a63f28c1558e52bacb10b5" + }, + { + "dataPath": "params_shard_58.bin", + "format": "raw-shard", + "nbytes": 45088768, + "records": [ + { + "name": "param_166", + "shape": [ + 22016, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 45088768, + "byteOffset": 0 + } + ], + "md5sum": "559eef05a8545f78f1e5dcc1096dc64b" + }, + { + "dataPath": "params_shard_59.bin", + "format": "raw-shard", + "nbytes": 22544384, + "records": [ + { + "name": "param_168", + "shape": [ + 4096, + 1376 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 22544384, + "byteOffset": 0 + } + ], + "md5sum": "e0fec23bb9981d2432fe2c4206659422" + }, + { + "dataPath": "params_shard_60.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_172", + "shape": [ + 12288, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "e9d28ccf1ad59fd6c63dbf3fa4f08ad1" + }, + { + "dataPath": "params_shard_61.bin", + "format": "raw-shard", + "nbytes": 32587776, + "records": [ + { + "name": "param_163", + "shape": [ + 12288, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 0 + }, + { + "name": "param_164", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 3145728 + }, + { + "name": "param_165", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 11534336 + }, + { + "name": "param_167", + "shape": [ + 22016, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5636096, + "byteOffset": 12582912 + }, + { + "name": "param_169", + "shape": [ + 4096, + 344 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2818048, + "byteOffset": 18219008 + }, + { + "name": "param_170", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 21037056 + }, + { + "name": "param_171", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 21045248 + }, + { + "name": "param_173", + "shape": [ + 12288, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 21053440 + }, + { + "name": "param_174", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 24199168 + } + ], + "md5sum": "e40d322af048cf1724973ea7ff249fb5" + }, + { + "dataPath": "params_shard_62.bin", + "format": "raw-shard", + "nbytes": 45088768, + "records": [ + { + "name": "param_176", + "shape": [ + 22016, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 45088768, + "byteOffset": 0 + } + ], + "md5sum": "118981e1b26ae3b7bc01cccd7767d5d1" + }, + { + "dataPath": "params_shard_63.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_182", + "shape": [ + 12288, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "f037570b706b5f8f275a48424e74f131" + }, + { + "dataPath": "params_shard_64.bin", + "format": "raw-shard", + "nbytes": 32063488, + "records": [ + { + "name": "param_175", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 0 + }, + { + "name": "param_177", + "shape": [ + 22016, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5636096, + "byteOffset": 1048576 + }, + { + "name": "param_178", + "shape": [ + 4096, + 1376 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 22544384, + "byteOffset": 6684672 + }, + { + "name": "param_179", + "shape": [ + 4096, + 344 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2818048, + "byteOffset": 29229056 + }, + { + "name": "param_180", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 32047104 + }, + { + "name": "param_181", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 32055296 + } + ], + "md5sum": "efff06e134fec9a2fb23084bb94462f7" + }, + { + "dataPath": "params_shard_65.bin", + "format": "raw-shard", + "nbytes": 45088768, + "records": [ + { + "name": "param_186", + "shape": [ + 22016, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 45088768, + "byteOffset": 0 + } + ], + "md5sum": "9568bef8132ddcceb420c893bdca4db4" + }, + { + "dataPath": "params_shard_66.bin", + "format": "raw-shard", + "nbytes": 22544384, + "records": [ + { + "name": "param_188", + "shape": [ + 4096, + 1376 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 22544384, + "byteOffset": 0 + } + ], + "md5sum": "1efce38e0e8abfd053b8825f62b97794" + }, + { + "dataPath": "params_shard_67.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_192", + "shape": [ + 12288, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "08c19412307fd0bb0a739b3c7d56c732" + }, + { + "dataPath": "params_shard_68.bin", + "format": "raw-shard", + "nbytes": 32587776, + "records": [ + { + "name": "param_183", + "shape": [ + 12288, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 0 + }, + { + "name": "param_184", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 3145728 + }, + { + "name": "param_185", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 11534336 + }, + { + "name": "param_187", + "shape": [ + 22016, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5636096, + "byteOffset": 12582912 + }, + { + "name": "param_189", + "shape": [ + 4096, + 344 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2818048, + "byteOffset": 18219008 + }, + { + "name": "param_190", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 21037056 + }, + { + "name": "param_191", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 21045248 + }, + { + "name": "param_193", + "shape": [ + 12288, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 21053440 + }, + { + "name": "param_194", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 24199168 + } + ], + "md5sum": "a8ae53cc765d442f65f9c6370abc727a" + }, + { + "dataPath": "params_shard_69.bin", + "format": "raw-shard", + "nbytes": 45088768, + "records": [ + { + "name": "param_196", + "shape": [ + 22016, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 45088768, + "byteOffset": 0 + } + ], + "md5sum": "8317d5e75386e7e5c0193a3fce95ed91" + }, + { + "dataPath": "params_shard_70.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_202", + "shape": [ + 12288, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "d27bbdd264bef7af1f8fe3d65564b1e3" + }, + { + "dataPath": "params_shard_71.bin", + "format": "raw-shard", + "nbytes": 32063488, + "records": [ + { + "name": "param_195", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 0 + }, + { + "name": "param_197", + "shape": [ + 22016, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5636096, + "byteOffset": 1048576 + }, + { + "name": "param_198", + "shape": [ + 4096, + 1376 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 22544384, + "byteOffset": 6684672 + }, + { + "name": "param_199", + "shape": [ + 4096, + 344 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2818048, + "byteOffset": 29229056 + }, + { + "name": "param_200", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 32047104 + }, + { + "name": "param_201", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 32055296 + } + ], + "md5sum": "c1c21326fbbc111a6ed4092637ad0856" + }, + { + "dataPath": "params_shard_72.bin", + "format": "raw-shard", + "nbytes": 45088768, + "records": [ + { + "name": "param_206", + "shape": [ + 22016, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 45088768, + "byteOffset": 0 + } + ], + "md5sum": "73b55633f68741b14b76d5bd92960543" + }, + { + "dataPath": "params_shard_73.bin", + "format": "raw-shard", + "nbytes": 22544384, + "records": [ + { + "name": "param_208", + "shape": [ + 4096, + 1376 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 22544384, + "byteOffset": 0 + } + ], + "md5sum": "52cc37d9b497f3a6147b58593c75f879" + }, + { + "dataPath": "params_shard_74.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_212", + "shape": [ + 12288, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "8ba0c925bf129c2de403301053d0f9fa" + }, + { + "dataPath": "params_shard_75.bin", + "format": "raw-shard", + "nbytes": 32587776, + "records": [ + { + "name": "param_203", + "shape": [ + 12288, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 0 + }, + { + "name": "param_204", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 3145728 + }, + { + "name": "param_205", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 11534336 + }, + { + "name": "param_207", + "shape": [ + 22016, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5636096, + "byteOffset": 12582912 + }, + { + "name": "param_209", + "shape": [ + 4096, + 344 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2818048, + "byteOffset": 18219008 + }, + { + "name": "param_210", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 21037056 + }, + { + "name": "param_211", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 21045248 + }, + { + "name": "param_213", + "shape": [ + 12288, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 21053440 + }, + { + "name": "param_214", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 24199168 + } + ], + "md5sum": "bf9b958009e75b014d051941e1e853a0" + }, + { + "dataPath": "params_shard_76.bin", + "format": "raw-shard", + "nbytes": 45088768, + "records": [ + { + "name": "param_216", + "shape": [ + 22016, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 45088768, + "byteOffset": 0 + } + ], + "md5sum": "fa67b0527d7fe960566550d100db8f9e" + }, + { + "dataPath": "params_shard_77.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_222", + "shape": [ + 12288, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "ba9014b453495fe1636d42a9264eebd0" + }, + { + "dataPath": "params_shard_78.bin", + "format": "raw-shard", + "nbytes": 32063488, + "records": [ + { + "name": "param_215", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 0 + }, + { + "name": "param_217", + "shape": [ + 22016, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5636096, + "byteOffset": 1048576 + }, + { + "name": "param_218", + "shape": [ + 4096, + 1376 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 22544384, + "byteOffset": 6684672 + }, + { + "name": "param_219", + "shape": [ + 4096, + 344 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2818048, + "byteOffset": 29229056 + }, + { + "name": "param_220", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 32047104 + }, + { + "name": "param_221", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 32055296 + } + ], + "md5sum": "d663dbd7554382124d72f6b754298a87" + }, + { + "dataPath": "params_shard_79.bin", + "format": "raw-shard", + "nbytes": 45088768, + "records": [ + { + "name": "param_226", + "shape": [ + 22016, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 45088768, + "byteOffset": 0 + } + ], + "md5sum": "076c3fe92cab4fb6e313a71aa929ddb3" + }, + { + "dataPath": "params_shard_80.bin", + "format": "raw-shard", + "nbytes": 22544384, + "records": [ + { + "name": "param_228", + "shape": [ + 4096, + 1376 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 22544384, + "byteOffset": 0 + } + ], + "md5sum": "7d6c2a42414f8bb2f4ea9ad299b529e6" + }, + { + "dataPath": "params_shard_81.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_232", + "shape": [ + 12288, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "f1b958ee45a947939eb9c3aebf1bec39" + }, + { + "dataPath": "params_shard_82.bin", + "format": "raw-shard", + "nbytes": 32587776, + "records": [ + { + "name": "param_223", + "shape": [ + 12288, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 0 + }, + { + "name": "param_224", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 3145728 + }, + { + "name": "param_225", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 11534336 + }, + { + "name": "param_227", + "shape": [ + 22016, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5636096, + "byteOffset": 12582912 + }, + { + "name": "param_229", + "shape": [ + 4096, + 344 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2818048, + "byteOffset": 18219008 + }, + { + "name": "param_230", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 21037056 + }, + { + "name": "param_231", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 21045248 + }, + { + "name": "param_233", + "shape": [ + 12288, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 21053440 + }, + { + "name": "param_234", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 24199168 + } + ], + "md5sum": "a48b4214ffb395eac1396f4251181d7f" + }, + { + "dataPath": "params_shard_83.bin", + "format": "raw-shard", + "nbytes": 45088768, + "records": [ + { + "name": "param_236", + "shape": [ + 22016, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 45088768, + "byteOffset": 0 + } + ], + "md5sum": "bc49f2f4f0a420a6610a5038e84e4edf" + }, + { + "dataPath": "params_shard_84.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_242", + "shape": [ + 12288, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "e9711331d06f0b8f3a2b0decbfbc2ac5" + }, + { + "dataPath": "params_shard_85.bin", + "format": "raw-shard", + "nbytes": 32063488, + "records": [ + { + "name": "param_235", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 0 + }, + { + "name": "param_237", + "shape": [ + 22016, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5636096, + "byteOffset": 1048576 + }, + { + "name": "param_238", + "shape": [ + 4096, + 1376 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 22544384, + "byteOffset": 6684672 + }, + { + "name": "param_239", + "shape": [ + 4096, + 344 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2818048, + "byteOffset": 29229056 + }, + { + "name": "param_240", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 32047104 + }, + { + "name": "param_241", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 32055296 + } + ], + "md5sum": "d108ad63eb760886b5808983af9b4337" + }, + { + "dataPath": "params_shard_86.bin", + "format": "raw-shard", + "nbytes": 45088768, + "records": [ + { + "name": "param_246", + "shape": [ + 22016, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 45088768, + "byteOffset": 0 + } + ], + "md5sum": "8f31b773f77ed6f2b2b1f6efa4cd1a69" + }, + { + "dataPath": "params_shard_87.bin", + "format": "raw-shard", + "nbytes": 22544384, + "records": [ + { + "name": "param_248", + "shape": [ + 4096, + 1376 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 22544384, + "byteOffset": 0 + } + ], + "md5sum": "e466cf95440c7ec65be944d3b573dd6a" + }, + { + "dataPath": "params_shard_88.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_252", + "shape": [ + 12288, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "1e3ad0992f3782f3812e3bcf4fc67891" + }, + { + "dataPath": "params_shard_89.bin", + "format": "raw-shard", + "nbytes": 32587776, + "records": [ + { + "name": "param_243", + "shape": [ + 12288, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 0 + }, + { + "name": "param_244", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 3145728 + }, + { + "name": "param_245", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 11534336 + }, + { + "name": "param_247", + "shape": [ + 22016, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5636096, + "byteOffset": 12582912 + }, + { + "name": "param_249", + "shape": [ + 4096, + 344 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2818048, + "byteOffset": 18219008 + }, + { + "name": "param_250", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 21037056 + }, + { + "name": "param_251", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 21045248 + }, + { + "name": "param_253", + "shape": [ + 12288, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 21053440 + }, + { + "name": "param_254", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 24199168 + } + ], + "md5sum": "3c11a5fef55fe8bb34857984edcfabeb" + }, + { + "dataPath": "params_shard_90.bin", + "format": "raw-shard", + "nbytes": 45088768, + "records": [ + { + "name": "param_256", + "shape": [ + 22016, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 45088768, + "byteOffset": 0 + } + ], + "md5sum": "ee7d0049b0e83683c98a61dfe0c57fe0" + }, + { + "dataPath": "params_shard_91.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_262", + "shape": [ + 12288, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "e3ae79d6bd4b4770bb5995e65dcb0fe2" + }, + { + "dataPath": "params_shard_92.bin", + "format": "raw-shard", + "nbytes": 32063488, + "records": [ + { + "name": "param_255", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 0 + }, + { + "name": "param_257", + "shape": [ + 22016, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5636096, + "byteOffset": 1048576 + }, + { + "name": "param_258", + "shape": [ + 4096, + 1376 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 22544384, + "byteOffset": 6684672 + }, + { + "name": "param_259", + "shape": [ + 4096, + 344 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2818048, + "byteOffset": 29229056 + }, + { + "name": "param_260", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 32047104 + }, + { + "name": "param_261", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 32055296 + } + ], + "md5sum": "7a7a2497aa8af3ac9c14db093f87c8fa" + }, + { + "dataPath": "params_shard_93.bin", + "format": "raw-shard", + "nbytes": 45088768, + "records": [ + { + "name": "param_266", + "shape": [ + 22016, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 45088768, + "byteOffset": 0 + } + ], + "md5sum": "edbfd11650e1559c82529c0cd5f3c6a2" + }, + { + "dataPath": "params_shard_94.bin", + "format": "raw-shard", + "nbytes": 22544384, + "records": [ + { + "name": "param_268", + "shape": [ + 4096, + 1376 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 22544384, + "byteOffset": 0 + } + ], + "md5sum": "e855907a404371d53aec12ac611551a9" + }, + { + "dataPath": "params_shard_95.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_272", + "shape": [ + 12288, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "69f7185a461844b057e5b39fc8374379" + }, + { + "dataPath": "params_shard_96.bin", + "format": "raw-shard", + "nbytes": 32587776, + "records": [ + { + "name": "param_263", + "shape": [ + 12288, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 0 + }, + { + "name": "param_264", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 3145728 + }, + { + "name": "param_265", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 11534336 + }, + { + "name": "param_267", + "shape": [ + 22016, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5636096, + "byteOffset": 12582912 + }, + { + "name": "param_269", + "shape": [ + 4096, + 344 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2818048, + "byteOffset": 18219008 + }, + { + "name": "param_270", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 21037056 + }, + { + "name": "param_271", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 21045248 + }, + { + "name": "param_273", + "shape": [ + 12288, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 21053440 + }, + { + "name": "param_274", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 24199168 + } + ], + "md5sum": "8279e8df06e99c2d7962965c35bb709c" + }, + { + "dataPath": "params_shard_97.bin", + "format": "raw-shard", + "nbytes": 45088768, + "records": [ + { + "name": "param_276", + "shape": [ + 22016, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 45088768, + "byteOffset": 0 + } + ], + "md5sum": "1af48438885cd6c1fc6bbf76c339ac0b" + }, + { + "dataPath": "params_shard_98.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_282", + "shape": [ + 12288, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "8c459dd4d6118f5dd6817a7433357329" + }, + { + "dataPath": "params_shard_99.bin", + "format": "raw-shard", + "nbytes": 32063488, + "records": [ + { + "name": "param_275", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 0 + }, + { + "name": "param_277", + "shape": [ + 22016, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5636096, + "byteOffset": 1048576 + }, + { + "name": "param_278", + "shape": [ + 4096, + 1376 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 22544384, + "byteOffset": 6684672 + }, + { + "name": "param_279", + "shape": [ + 4096, + 344 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2818048, + "byteOffset": 29229056 + }, + { + "name": "param_280", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 32047104 + }, + { + "name": "param_281", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 32055296 + } + ], + "md5sum": "919f21b25152b4a3f4399e40abeaaf02" + }, + { + "dataPath": "params_shard_100.bin", + "format": "raw-shard", + "nbytes": 45088768, + "records": [ + { + "name": "param_286", + "shape": [ + 22016, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 45088768, + "byteOffset": 0 + } + ], + "md5sum": "5dd2171bd06bc7b1350f66ecbb4815cd" + }, + { + "dataPath": "params_shard_101.bin", + "format": "raw-shard", + "nbytes": 22544384, + "records": [ + { + "name": "param_288", + "shape": [ + 4096, + 1376 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 22544384, + "byteOffset": 0 + } + ], + "md5sum": "9cbb16e5c05481e015944f1661ac3db3" + }, + { + "dataPath": "params_shard_102.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_292", + "shape": [ + 12288, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "977e51bb26eb58e4855d1b010cbade3e" + }, + { + "dataPath": "params_shard_103.bin", + "format": "raw-shard", + "nbytes": 32587776, + "records": [ + { + "name": "param_283", + "shape": [ + 12288, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 0 + }, + { + "name": "param_284", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 3145728 + }, + { + "name": "param_285", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 11534336 + }, + { + "name": "param_287", + "shape": [ + 22016, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5636096, + "byteOffset": 12582912 + }, + { + "name": "param_289", + "shape": [ + 4096, + 344 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2818048, + "byteOffset": 18219008 + }, + { + "name": "param_290", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 21037056 + }, + { + "name": "param_291", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 21045248 + }, + { + "name": "param_293", + "shape": [ + 12288, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 21053440 + }, + { + "name": "param_294", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 24199168 + } + ], + "md5sum": "9121656e4c2eedd0ab11678445c9d9fd" + }, + { + "dataPath": "params_shard_104.bin", + "format": "raw-shard", + "nbytes": 45088768, + "records": [ + { + "name": "param_296", + "shape": [ + 22016, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 45088768, + "byteOffset": 0 + } + ], + "md5sum": "e98b170d328b10c630a54277b22ffcfc" + }, + { + "dataPath": "params_shard_105.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_302", + "shape": [ + 12288, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "fccb8f644ba2fadfcefc478cf4ac9492" + }, + { + "dataPath": "params_shard_106.bin", + "format": "raw-shard", + "nbytes": 32063488, + "records": [ + { + "name": "param_295", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 0 + }, + { + "name": "param_297", + "shape": [ + 22016, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5636096, + "byteOffset": 1048576 + }, + { + "name": "param_298", + "shape": [ + 4096, + 1376 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 22544384, + "byteOffset": 6684672 + }, + { + "name": "param_299", + "shape": [ + 4096, + 344 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2818048, + "byteOffset": 29229056 + }, + { + "name": "param_300", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 32047104 + }, + { + "name": "param_301", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 32055296 + } + ], + "md5sum": "588d4fba64d289d77e536726d12291f9" + }, + { + "dataPath": "params_shard_107.bin", + "format": "raw-shard", + "nbytes": 45088768, + "records": [ + { + "name": "param_306", + "shape": [ + 22016, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 45088768, + "byteOffset": 0 + } + ], + "md5sum": "e5b1f7d1b2b335377349813e39bbb040" + }, + { + "dataPath": "params_shard_108.bin", + "format": "raw-shard", + "nbytes": 22544384, + "records": [ + { + "name": "param_308", + "shape": [ + 4096, + 1376 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 22544384, + "byteOffset": 0 + } + ], + "md5sum": "f020e70fea1c828d87fa1d941501e003" + }, + { + "dataPath": "params_shard_109.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_312", + "shape": [ + 12288, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "a5499f8c46fcb9250d398f57e268e043" + }, + { + "dataPath": "params_shard_110.bin", + "format": "raw-shard", + "nbytes": 32587776, + "records": [ + { + "name": "param_303", + "shape": [ + 12288, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 0 + }, + { + "name": "param_304", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 3145728 + }, + { + "name": "param_305", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 11534336 + }, + { + "name": "param_307", + "shape": [ + 22016, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5636096, + "byteOffset": 12582912 + }, + { + "name": "param_309", + "shape": [ + 4096, + 344 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2818048, + "byteOffset": 18219008 + }, + { + "name": "param_310", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 21037056 + }, + { + "name": "param_311", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 21045248 + }, + { + "name": "param_313", + "shape": [ + 12288, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 21053440 + }, + { + "name": "param_314", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 24199168 + } + ], + "md5sum": "91b433a79efcd7ef372f4e33ea5c0bf9" + }, + { + "dataPath": "params_shard_111.bin", + "format": "raw-shard", + "nbytes": 45088768, + "records": [ + { + "name": "param_316", + "shape": [ + 22016, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 45088768, + "byteOffset": 0 + } + ], + "md5sum": "e79baf1d0ad3cac962c0f35543c0f31c" + }, + { + "dataPath": "params_shard_112.bin", + "format": "raw-shard", + "nbytes": 65536000, + "records": [ + { + "name": "param_323", + "shape": [ + 32000, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 65536000, + "byteOffset": 0 + } + ], + "md5sum": "959656d0e7064e832d774e1cb1b3bc67" + }, + { + "dataPath": "params_shard_113.bin", + "format": "raw-shard", + "nbytes": 32071680, + "records": [ + { + "name": "param_315", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 0 + }, + { + "name": "param_317", + "shape": [ + 22016, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 5636096, + "byteOffset": 1048576 + }, + { + "name": "param_318", + "shape": [ + 4096, + 1376 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 22544384, + "byteOffset": 6684672 + }, + { + "name": "param_319", + "shape": [ + 4096, + 344 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2818048, + "byteOffset": 29229056 + }, + { + "name": "param_320", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 32047104 + }, + { + "name": "param_321", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 32055296 + }, + { + "name": "param_322", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 32063488 + } + ], + "md5sum": "9cd331ce1d1b70313bf19e07fd026b04" + }, + { + "dataPath": "params_shard_114.bin", + "format": "raw-shard", + "nbytes": 9240576, + "records": [ + { + "name": "param_324", + "shape": [ + 32000, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192000, + "byteOffset": 0 + }, + { + "name": "param_325", + "shape": [ + 2048, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 524288, + "byteOffset": 8192000 + }, + { + "name": "param_326", + "shape": [ + 2048, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 524288, + "byteOffset": 8716288 + } + ], + "md5sum": "f5670184515a7d18f8cea44ebb717eb8" + } + ] +} \ No newline at end of file