diff --git "a/ndarray-cache.json" "b/ndarray-cache.json" new file mode 100644--- /dev/null +++ "b/ndarray-cache.json" @@ -0,0 +1,4395 @@ +{ + "metadata": { + "ParamSize": 327 + }, + "records": [ + { + "dataPath": "params_shard_0.bin", + "format": "raw-shard", + "nbytes": 65536000, + "records": [ + { + "name": "param_0", + "shape": [ + 32000, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 65536000, + "byteOffset": 0 + } + ], + "md5sum": "010e0e984a7a5c101ae350bb3efcdda2" + }, + { + "dataPath": "params_shard_1.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_6", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "18ddac48ecf74081841460721ba178e1" + }, + { + "dataPath": "params_shard_2.bin", + "format": "raw-shard", + "nbytes": 31784960, + "records": [ + { + "name": "param_1", + "shape": [ + 32000, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192000, + "byteOffset": 0 + }, + { + "name": "param_2", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 8192000 + }, + { + "name": "param_3", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 20774912 + }, + { + "name": "param_4", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 22347776 + }, + { + "name": "param_5", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 30736384 + } + ], + "md5sum": "eb39022c7824d26951f7410ba2f1197a" + }, + { + "dataPath": "params_shard_3.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_8", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "b7a5c9f40e7e0420ca54da5ea824a79d" + }, + { + "dataPath": "params_shard_4.bin", + "format": "raw-shard", + "nbytes": 25182208, + "records": [ + { + "name": "param_7", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_9", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_10", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_11", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_12", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 11026432 + }, + { + "name": "param_13", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 23609344 + } + ], + "md5sum": "81a9e9450934f290f0f19077fa92f279" + }, + { + "dataPath": "params_shard_5.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_16", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "632492dd4047ded4f5976d6c28144e21" + }, + { + "dataPath": "params_shard_6.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_18", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "3b007034a4cb24a6fcb5e1f7a75f7cb1" + }, + { + "dataPath": "params_shard_7.bin", + "format": "raw-shard", + "nbytes": 33046528, + "records": [ + { + "name": "param_14", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_15", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_17", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 9437184 + }, + { + "name": "param_19", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 16777216 + }, + { + "name": "param_20", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20447232 + }, + { + "name": "param_21", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20455424 + }, + { + "name": "param_22", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 20463616 + } + ], + "md5sum": "5fdf3d559a964dbdc0f117d1b9985072" + }, + { + "dataPath": "params_shard_8.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_26", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "167ca2bcc8bf37110692d2e626b02522" + }, + { + "dataPath": "params_shard_9.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_28", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "be367a60ca1173746d543654d887ce7d" + }, + { + "dataPath": "params_shard_10.bin", + "format": "raw-shard", + "nbytes": 22036480, + "records": [ + { + "name": "param_23", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 0 + }, + { + "name": "param_24", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 1572864 + }, + { + "name": "param_25", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 9961472 + }, + { + "name": "param_27", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 11010048 + }, + { + "name": "param_29", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 18350080 + }, + { + "name": "param_30", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22020096 + }, + { + "name": "param_31", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22028288 + } + ], + "md5sum": "d1ac6c3a2c11bafcee4dfa7535e97ff5" + }, + { + "dataPath": "params_shard_11.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_36", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "72a0a028bbb561115a5d945ef9537fad" + }, + { + "dataPath": "params_shard_12.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_38", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "0186707d7e733b3b23d0ccb43f0744af" + }, + { + "dataPath": "params_shard_13.bin", + "format": "raw-shard", + "nbytes": 30932992, + "records": [ + { + "name": "param_32", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "param_33", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 12582912 + }, + { + "name": "param_34", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 14155776 + }, + { + "name": "param_35", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 22544384 + }, + { + "name": "param_37", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 23592960 + } + ], + "md5sum": "e3b5da9e01a09fbed893a93ab14e2a91" + }, + { + "dataPath": "params_shard_14.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_46", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "9dd5bf4cb999c9c531f0515c2c5e551b" + }, + { + "dataPath": "params_shard_15.bin", + "format": "raw-shard", + "nbytes": 27279360, + "records": [ + { + "name": "param_39", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 0 + }, + { + "name": "param_40", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3670016 + }, + { + "name": "param_41", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3678208 + }, + { + "name": "param_42", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 3686400 + }, + { + "name": "param_43", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 16269312 + }, + { + "name": "param_44", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 17842176 + }, + { + "name": "param_45", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 26230784 + } + ], + "md5sum": "7cfa6e3a23e6c8300934687eab5a4ff6" + }, + { + "dataPath": "params_shard_16.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_48", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "24c92a047c05f93ede773d1cf6baa3ad" + }, + { + "dataPath": "params_shard_17.bin", + "format": "raw-shard", + "nbytes": 25182208, + "records": [ + { + "name": "param_47", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_49", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_50", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_51", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_52", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 11026432 + }, + { + "name": "param_53", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 23609344 + } + ], + "md5sum": "d34283639f554124c509d26a21196add" + }, + { + "dataPath": "params_shard_18.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_56", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "5c9e5ff394137caf6369d600d8ff3e1a" + }, + { + "dataPath": "params_shard_19.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_58", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "3b9ba512284d33cf95b81f9078ee4851" + }, + { + "dataPath": "params_shard_20.bin", + "format": "raw-shard", + "nbytes": 33046528, + "records": [ + { + "name": "param_54", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_55", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_57", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 9437184 + }, + { + "name": "param_59", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 16777216 + }, + { + "name": "param_60", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20447232 + }, + { + "name": "param_61", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20455424 + }, + { + "name": "param_62", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 20463616 + } + ], + "md5sum": "b36a5a4530d8deb9b23914c13347160d" + }, + { + "dataPath": "params_shard_21.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_66", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "45c87fb61e3e610d29e3ccfdfe6016b2" + }, + { + "dataPath": "params_shard_22.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_68", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "dc68c0b35a95a28562de34da5c0bbf4d" + }, + { + "dataPath": "params_shard_23.bin", + "format": "raw-shard", + "nbytes": 22036480, + "records": [ + { + "name": "param_63", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 0 + }, + { + "name": "param_64", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 1572864 + }, + { + "name": "param_65", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 9961472 + }, + { + "name": "param_67", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 11010048 + }, + { + "name": "param_69", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 18350080 + }, + { + "name": "param_70", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22020096 + }, + { + "name": "param_71", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22028288 + } + ], + "md5sum": "efc1169ded5c0e6bb91c8fff9421fbc3" + }, + { + "dataPath": "params_shard_24.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_76", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "9d7f127fa33c1ba611a4d7c9b090adb1" + }, + { + "dataPath": "params_shard_25.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_78", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "5e243c8f28577a967fdd29234aa4340a" + }, + { + "dataPath": "params_shard_26.bin", + "format": "raw-shard", + "nbytes": 30932992, + "records": [ + { + "name": "param_72", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "param_73", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 12582912 + }, + { + "name": "param_74", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 14155776 + }, + { + "name": "param_75", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 22544384 + }, + { + "name": "param_77", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 23592960 + } + ], + "md5sum": "9b9f0d5b12d95625d1c62f23fb81fb5b" + }, + { + "dataPath": "params_shard_27.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_86", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "40020100b0d998e82c0bad8e31f4694e" + }, + { + "dataPath": "params_shard_28.bin", + "format": "raw-shard", + "nbytes": 27279360, + "records": [ + { + "name": "param_79", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 0 + }, + { + "name": "param_80", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3670016 + }, + { + "name": "param_81", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3678208 + }, + { + "name": "param_82", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 3686400 + }, + { + "name": "param_83", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 16269312 + }, + { + "name": "param_84", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 17842176 + }, + { + "name": "param_85", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 26230784 + } + ], + "md5sum": "be0e010827db00860d2e9c83ba190d69" + }, + { + "dataPath": "params_shard_29.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_88", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "75741ad534926f90550ed2bdd774c914" + }, + { + "dataPath": "params_shard_30.bin", + "format": "raw-shard", + "nbytes": 25182208, + "records": [ + { + "name": "param_87", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_89", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_90", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_91", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_92", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 11026432 + }, + { + "name": "param_93", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 23609344 + } + ], + "md5sum": "bf5835a74889ab5adbc13a75511ffbcf" + }, + { + "dataPath": "params_shard_31.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_96", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "4f365a97ddd810f012bd7aa7ed1e2803" + }, + { + "dataPath": "params_shard_32.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_98", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "b696245fa5bb9754f69c04a6eb9c2592" + }, + { + "dataPath": "params_shard_33.bin", + "format": "raw-shard", + "nbytes": 33046528, + "records": [ + { + "name": "param_94", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_95", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_97", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 9437184 + }, + { + "name": "param_99", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 16777216 + }, + { + "name": "param_100", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20447232 + }, + { + "name": "param_101", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20455424 + }, + { + "name": "param_102", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 20463616 + } + ], + "md5sum": "3f019e9ccef3e3d1a2cde371bd1affb5" + }, + { + "dataPath": "params_shard_34.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_106", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "4963c254463fd834b7c6c6dec62bc768" + }, + { + "dataPath": "params_shard_35.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_108", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "f287c1554d8d1e86000ec9570321d218" + }, + { + "dataPath": "params_shard_36.bin", + "format": "raw-shard", + "nbytes": 22036480, + "records": [ + { + "name": "param_103", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 0 + }, + { + "name": "param_104", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 1572864 + }, + { + "name": "param_105", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 9961472 + }, + { + "name": "param_107", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 11010048 + }, + { + "name": "param_109", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 18350080 + }, + { + "name": "param_110", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22020096 + }, + { + "name": "param_111", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22028288 + } + ], + "md5sum": "6867bc2427a3c297bd452014d3c77b0f" + }, + { + "dataPath": "params_shard_37.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_116", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "5f4dc4ed4aca799c504440e57fca2105" + }, + { + "dataPath": "params_shard_38.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_118", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "7b899f9ce568f52bc3682c89cf76eb8a" + }, + { + "dataPath": "params_shard_39.bin", + "format": "raw-shard", + "nbytes": 30932992, + "records": [ + { + "name": "param_112", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "param_113", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 12582912 + }, + { + "name": "param_114", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 14155776 + }, + { + "name": "param_115", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 22544384 + }, + { + "name": "param_117", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 23592960 + } + ], + "md5sum": "62b8393e818b4b67b2861856a06f1644" + }, + { + "dataPath": "params_shard_40.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_126", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "882ecdac7c0fd3e9c07d3d8fa89b6590" + }, + { + "dataPath": "params_shard_41.bin", + "format": "raw-shard", + "nbytes": 27279360, + "records": [ + { + "name": "param_119", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 0 + }, + { + "name": "param_120", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3670016 + }, + { + "name": "param_121", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3678208 + }, + { + "name": "param_122", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 3686400 + }, + { + "name": "param_123", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 16269312 + }, + { + "name": "param_124", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 17842176 + }, + { + "name": "param_125", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 26230784 + } + ], + "md5sum": "90bf241a78941c8c073491e0175a5cc5" + }, + { + "dataPath": "params_shard_42.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_128", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "3e3b84268b4e142ef48dfc5f00f00326" + }, + { + "dataPath": "params_shard_43.bin", + "format": "raw-shard", + "nbytes": 25182208, + "records": [ + { + "name": "param_127", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_129", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_130", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_131", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_132", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 11026432 + }, + { + "name": "param_133", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 23609344 + } + ], + "md5sum": "f84d94f005ab5d42b4aa68c97be637a2" + }, + { + "dataPath": "params_shard_44.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_136", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "f568eb9b297a9a6d7a391948717b1e56" + }, + { + "dataPath": "params_shard_45.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_138", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "6e6379dad6a61b657f5bbeb949f30a9e" + }, + { + "dataPath": "params_shard_46.bin", + "format": "raw-shard", + "nbytes": 33046528, + "records": [ + { + "name": "param_134", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_135", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_137", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 9437184 + }, + { + "name": "param_139", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 16777216 + }, + { + "name": "param_140", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20447232 + }, + { + "name": "param_141", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20455424 + }, + { + "name": "param_142", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 20463616 + } + ], + "md5sum": "5a8fb529fbf3a6000e31c1e1993b2bbb" + }, + { + "dataPath": "params_shard_47.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_146", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "5dd23a6c6afe427946c4eb3db97312be" + }, + { + "dataPath": "params_shard_48.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_148", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "1716427eb7d5797efdd05538176aa1e2" + }, + { + "dataPath": "params_shard_49.bin", + "format": "raw-shard", + "nbytes": 22036480, + "records": [ + { + "name": "param_143", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 0 + }, + { + "name": "param_144", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 1572864 + }, + { + "name": "param_145", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 9961472 + }, + { + "name": "param_147", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 11010048 + }, + { + "name": "param_149", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 18350080 + }, + { + "name": "param_150", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22020096 + }, + { + "name": "param_151", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22028288 + } + ], + "md5sum": "0f31824636c65198ddf46cf0ff207606" + }, + { + "dataPath": "params_shard_50.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_156", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "313e63721cb47bfd745ea6375e8f3bc5" + }, + { + "dataPath": "params_shard_51.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_158", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "48508fb49739835752fc2dfb14c12e3b" + }, + { + "dataPath": "params_shard_52.bin", + "format": "raw-shard", + "nbytes": 30932992, + "records": [ + { + "name": "param_152", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "param_153", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 12582912 + }, + { + "name": "param_154", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 14155776 + }, + { + "name": "param_155", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 22544384 + }, + { + "name": "param_157", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 23592960 + } + ], + "md5sum": "b02b6d88de014c46bcd72349bf28903a" + }, + { + "dataPath": "params_shard_53.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_166", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "1e8861609545adeb90af8d7387567501" + }, + { + "dataPath": "params_shard_54.bin", + "format": "raw-shard", + "nbytes": 27279360, + "records": [ + { + "name": "param_159", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 0 + }, + { + "name": "param_160", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3670016 + }, + { + "name": "param_161", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3678208 + }, + { + "name": "param_162", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 3686400 + }, + { + "name": "param_163", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 16269312 + }, + { + "name": "param_164", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 17842176 + }, + { + "name": "param_165", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 26230784 + } + ], + "md5sum": "de99184d6cfdc378970e8231c2473f58" + }, + { + "dataPath": "params_shard_55.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_168", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "c5effb73da28d9bc24ede9b127991b14" + }, + { + "dataPath": "params_shard_56.bin", + "format": "raw-shard", + "nbytes": 25182208, + "records": [ + { + "name": "param_167", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_169", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_170", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_171", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_172", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 11026432 + }, + { + "name": "param_173", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 23609344 + } + ], + "md5sum": "d4ae9e979dc972ac7cae149b04ed4327" + }, + { + "dataPath": "params_shard_57.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_176", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "3563a7deec08cba304aaf94286c936e0" + }, + { + "dataPath": "params_shard_58.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_178", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "e61c57698d9aa3367e53c83566720cbd" + }, + { + "dataPath": "params_shard_59.bin", + "format": "raw-shard", + "nbytes": 33046528, + "records": [ + { + "name": "param_174", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_175", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_177", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 9437184 + }, + { + "name": "param_179", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 16777216 + }, + { + "name": "param_180", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20447232 + }, + { + "name": "param_181", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20455424 + }, + { + "name": "param_182", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 20463616 + } + ], + "md5sum": "bd5262a818ee5120858b7e2da895590d" + }, + { + "dataPath": "params_shard_60.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_186", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "af88fa4430c14be6156b2a569767cd34" + }, + { + "dataPath": "params_shard_61.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_188", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "fb425f4a114a1a9b06f1efb8418cdc0e" + }, + { + "dataPath": "params_shard_62.bin", + "format": "raw-shard", + "nbytes": 22036480, + "records": [ + { + "name": "param_183", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 0 + }, + { + "name": "param_184", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 1572864 + }, + { + "name": "param_185", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 9961472 + }, + { + "name": "param_187", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 11010048 + }, + { + "name": "param_189", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 18350080 + }, + { + "name": "param_190", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22020096 + }, + { + "name": "param_191", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22028288 + } + ], + "md5sum": "35ff4c0470a0bcfc79a3ed0e2469d291" + }, + { + "dataPath": "params_shard_63.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_196", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "ec0ef966951c15923f35566d9081d00f" + }, + { + "dataPath": "params_shard_64.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_198", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "7cf92ca7b473df788677bf7997b6a6e5" + }, + { + "dataPath": "params_shard_65.bin", + "format": "raw-shard", + "nbytes": 30932992, + "records": [ + { + "name": "param_192", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "param_193", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 12582912 + }, + { + "name": "param_194", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 14155776 + }, + { + "name": "param_195", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 22544384 + }, + { + "name": "param_197", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 23592960 + } + ], + "md5sum": "870e5e676140b49b3f92b8e030fa29ad" + }, + { + "dataPath": "params_shard_66.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_206", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "49554aed7225e56281a095450a650c27" + }, + { + "dataPath": "params_shard_67.bin", + "format": "raw-shard", + "nbytes": 27279360, + "records": [ + { + "name": "param_199", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 0 + }, + { + "name": "param_200", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3670016 + }, + { + "name": "param_201", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3678208 + }, + { + "name": "param_202", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 3686400 + }, + { + "name": "param_203", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 16269312 + }, + { + "name": "param_204", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 17842176 + }, + { + "name": "param_205", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 26230784 + } + ], + "md5sum": "991f75587fe66c7c9cde68237ee5afbb" + }, + { + "dataPath": "params_shard_68.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_208", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "0cb3b295225d5e2044806c87d2419d2e" + }, + { + "dataPath": "params_shard_69.bin", + "format": "raw-shard", + "nbytes": 25182208, + "records": [ + { + "name": "param_207", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_209", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_210", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_211", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_212", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 11026432 + }, + { + "name": "param_213", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 23609344 + } + ], + "md5sum": "97f1c722d2db08ef0ef6e8dba6c197ca" + }, + { + "dataPath": "params_shard_70.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_216", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "eecfb64d040a26fef22eca693676b942" + }, + { + "dataPath": "params_shard_71.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_218", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "0943f7f844a2ae5d0108f0795ff8d999" + }, + { + "dataPath": "params_shard_72.bin", + "format": "raw-shard", + "nbytes": 33046528, + "records": [ + { + "name": "param_214", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_215", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_217", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 9437184 + }, + { + "name": "param_219", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 16777216 + }, + { + "name": "param_220", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20447232 + }, + { + "name": "param_221", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20455424 + }, + { + "name": "param_222", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 20463616 + } + ], + "md5sum": "c85ce4c771f60b3ab72c9bfb1d584a3d" + }, + { + "dataPath": "params_shard_73.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_226", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "4524f3ce2cf5fa63484a17263ef36424" + }, + { + "dataPath": "params_shard_74.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_228", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "3733694d43be7206c0bd3fd606177756" + }, + { + "dataPath": "params_shard_75.bin", + "format": "raw-shard", + "nbytes": 22036480, + "records": [ + { + "name": "param_223", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 0 + }, + { + "name": "param_224", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 1572864 + }, + { + "name": "param_225", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 9961472 + }, + { + "name": "param_227", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 11010048 + }, + { + "name": "param_229", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 18350080 + }, + { + "name": "param_230", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22020096 + }, + { + "name": "param_231", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22028288 + } + ], + "md5sum": "94a1124d6d8d337d671a777658b80f30" + }, + { + "dataPath": "params_shard_76.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_236", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "3c3585d0da985c53d322bf3cedf898cd" + }, + { + "dataPath": "params_shard_77.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_238", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "083ff7789a82b8a0500797f4510420e8" + }, + { + "dataPath": "params_shard_78.bin", + "format": "raw-shard", + "nbytes": 30932992, + "records": [ + { + "name": "param_232", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "param_233", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 12582912 + }, + { + "name": "param_234", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 14155776 + }, + { + "name": "param_235", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 22544384 + }, + { + "name": "param_237", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 23592960 + } + ], + "md5sum": "79ce10f566932dbaca20f6aa01bfb50c" + }, + { + "dataPath": "params_shard_79.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_246", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "dbd575b48c545ba628b764a742df1643" + }, + { + "dataPath": "params_shard_80.bin", + "format": "raw-shard", + "nbytes": 27279360, + "records": [ + { + "name": "param_239", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 0 + }, + { + "name": "param_240", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3670016 + }, + { + "name": "param_241", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3678208 + }, + { + "name": "param_242", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 3686400 + }, + { + "name": "param_243", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 16269312 + }, + { + "name": "param_244", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 17842176 + }, + { + "name": "param_245", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 26230784 + } + ], + "md5sum": "1779e65906e1640060d4cb2c6800cb4c" + }, + { + "dataPath": "params_shard_81.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_248", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "5d481e7c0a183ab76502dea078434df0" + }, + { + "dataPath": "params_shard_82.bin", + "format": "raw-shard", + "nbytes": 25182208, + "records": [ + { + "name": "param_247", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_249", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_250", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_251", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_252", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 11026432 + }, + { + "name": "param_253", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 23609344 + } + ], + "md5sum": "08c8baac6560e90372a9ccc66067626f" + }, + { + "dataPath": "params_shard_83.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_256", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "a3d40cb3331e0c82f771670a3a2d615d" + }, + { + "dataPath": "params_shard_84.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_258", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "5d1b442300a6d88d89e7a4476261b0d5" + }, + { + "dataPath": "params_shard_85.bin", + "format": "raw-shard", + "nbytes": 33046528, + "records": [ + { + "name": "param_254", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_255", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_257", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 9437184 + }, + { + "name": "param_259", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 16777216 + }, + { + "name": "param_260", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20447232 + }, + { + "name": "param_261", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20455424 + }, + { + "name": "param_262", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 20463616 + } + ], + "md5sum": "2cc30736918c5e3b8fb709b771237bcc" + }, + { + "dataPath": "params_shard_86.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_266", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "1cb06f34117c0478719cdd5d9ae42e3e" + }, + { + "dataPath": "params_shard_87.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_268", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "65181c1462b79b6174104cf79837625f" + }, + { + "dataPath": "params_shard_88.bin", + "format": "raw-shard", + "nbytes": 22036480, + "records": [ + { + "name": "param_263", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 0 + }, + { + "name": "param_264", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 1572864 + }, + { + "name": "param_265", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 9961472 + }, + { + "name": "param_267", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 11010048 + }, + { + "name": "param_269", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 18350080 + }, + { + "name": "param_270", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22020096 + }, + { + "name": "param_271", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22028288 + } + ], + "md5sum": "e652845bb01e139851f7c590f03264b3" + }, + { + "dataPath": "params_shard_89.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_276", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "1e86bd32337d529497b6a4921fd92b69" + }, + { + "dataPath": "params_shard_90.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_278", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "4aa1ab9c9f624d6da37f401dbe5546e9" + }, + { + "dataPath": "params_shard_91.bin", + "format": "raw-shard", + "nbytes": 30932992, + "records": [ + { + "name": "param_272", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "param_273", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 12582912 + }, + { + "name": "param_274", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 14155776 + }, + { + "name": "param_275", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 22544384 + }, + { + "name": "param_277", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 23592960 + } + ], + "md5sum": "a8d9243709c2b803f989693c7ae940ec" + }, + { + "dataPath": "params_shard_92.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_286", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "db143e93f149dd87a07e44ea65ad02bd" + }, + { + "dataPath": "params_shard_93.bin", + "format": "raw-shard", + "nbytes": 27279360, + "records": [ + { + "name": "param_279", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 0 + }, + { + "name": "param_280", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3670016 + }, + { + "name": "param_281", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3678208 + }, + { + "name": "param_282", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 3686400 + }, + { + "name": "param_283", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 16269312 + }, + { + "name": "param_284", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 17842176 + }, + { + "name": "param_285", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 26230784 + } + ], + "md5sum": "ab09a4ebf7c38da97c3d5051d23a9b78" + }, + { + "dataPath": "params_shard_94.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_288", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "f6d00afdab0ef366f783d34ee9348492" + }, + { + "dataPath": "params_shard_95.bin", + "format": "raw-shard", + "nbytes": 25182208, + "records": [ + { + "name": "param_287", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_289", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_290", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_291", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_292", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 11026432 + }, + { + "name": "param_293", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 23609344 + } + ], + "md5sum": "3f6275e6c1c36c7312850ce9210e0843" + }, + { + "dataPath": "params_shard_96.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_296", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "da7abfc00787e84e7b96f02530136fb8" + }, + { + "dataPath": "params_shard_97.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_298", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "573712ca6d0d9bb635c2dfe84d4f922f" + }, + { + "dataPath": "params_shard_98.bin", + "format": "raw-shard", + "nbytes": 33046528, + "records": [ + { + "name": "param_294", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 0 + }, + { + "name": "param_295", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 8388608 + }, + { + "name": "param_297", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 9437184 + }, + { + "name": "param_299", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 16777216 + }, + { + "name": "param_300", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20447232 + }, + { + "name": "param_301", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 20455424 + }, + { + "name": "param_302", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 20463616 + } + ], + "md5sum": "12ccbd012e997cd4425d7f1b55920bb3" + }, + { + "dataPath": "params_shard_99.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_306", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "ce677c57c0775ea85cc454452880daeb" + }, + { + "dataPath": "params_shard_100.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_308", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "ddfb1d8405df2801eece0af8eefe2e98" + }, + { + "dataPath": "params_shard_101.bin", + "format": "raw-shard", + "nbytes": 22036480, + "records": [ + { + "name": "param_303", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 0 + }, + { + "name": "param_304", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 1572864 + }, + { + "name": "param_305", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 9961472 + }, + { + "name": "param_307", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 11010048 + }, + { + "name": "param_309", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 18350080 + }, + { + "name": "param_310", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22020096 + }, + { + "name": "param_311", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 22028288 + } + ], + "md5sum": "1641d348e0e67b8b0a35a38373ea56ca" + }, + { + "dataPath": "params_shard_102.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_316", + "shape": [ + 28672, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "6a0af5b07f3a77fbefe0a5c622f5c849" + }, + { + "dataPath": "params_shard_103.bin", + "format": "raw-shard", + "nbytes": 29360128, + "records": [ + { + "name": "param_318", + "shape": [ + 4096, + 1792 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 29360128, + "byteOffset": 0 + } + ], + "md5sum": "f2f2db5490fd11f30264019b46c57163" + }, + { + "dataPath": "params_shard_104.bin", + "format": "raw-shard", + "nbytes": 30932992, + "records": [ + { + "name": "param_312", + "shape": [ + 6144, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "param_313", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 12582912 + }, + { + "name": "param_314", + "shape": [ + 4096, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 8388608, + "byteOffset": 14155776 + }, + { + "name": "param_315", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 22544384 + }, + { + "name": "param_317", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 23592960 + } + ], + "md5sum": "e9d9eca093921857e3a56e3f161ad7ba" + }, + { + "dataPath": "params_shard_105.bin", + "format": "raw-shard", + "nbytes": 65536000, + "records": [ + { + "name": "param_323", + "shape": [ + 32000, + 512 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 65536000, + "byteOffset": 0 + } + ], + "md5sum": "e6482125b3ae846df8eee6c33d75a634" + }, + { + "dataPath": "params_shard_106.bin", + "format": "raw-shard", + "nbytes": 12935168, + "records": [ + { + "name": "param_319", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 0 + }, + { + "name": "param_320", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3670016 + }, + { + "name": "param_321", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3678208 + }, + { + "name": "param_322", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 3686400 + }, + { + "name": "param_324", + "shape": [ + 32000, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192000, + "byteOffset": 3694592 + }, + { + "name": "param_325", + "shape": [ + 2048, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 524288, + "byteOffset": 11886592 + }, + { + "name": "param_326", + "shape": [ + 2048, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 524288, + "byteOffset": 12410880 + } + ], + "md5sum": "a6a2c0a93bbdfd9f2f7d70c7335ee5e2" + } + ] +} \ No newline at end of file