diff --git a/ndarray-cache.json b/ndarray-cache.json new file mode 100644 index 0000000000000000000000000000000000000000..d7e841ccd3c73445b6a8372edff64d62b9c52a34 --- /dev/null +++ b/ndarray-cache.json @@ -0,0 +1,4673 @@ +{ + "metadata": { + "ParamSize": 291, + "ParamBytes": 39722299392.0, + "BitsPerParam": 14.56926321506206 + }, + "records": [ + { + "dataPath": "params_shard_0.bin", + "format": "raw-shard", + "nbytes": 75497472, + "records": [ + { + "name": "model.layers.0.attention.wo.weight", + "shape": [ + 6144, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 75497472, + "byteOffset": 0 + } + ], + "md5sum": "7db413de247aca08fe9236a2e9090e48" + }, + { + "dataPath": "params_shard_1.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.0.attention.wqkv.weight", + "shape": [ + 8192, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "59c77c1eb45dcbec5f24042796d014fd" + }, + { + "dataPath": "params_shard_2.bin", + "format": "raw-shard", + "nbytes": 402653184, + "records": [ + { + "name": "model.layers.0.feed_forward.gate_up_proj.weight", + "shape": [ + 32768, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 402653184, + "byteOffset": 0 + } + ], + "md5sum": "66271a8bfdc881d530bddce423a16473" + }, + { + "dataPath": "params_shard_3.bin", + "format": "raw-shard", + "nbytes": 201326592, + "records": [ + { + "name": "model.layers.0.feed_forward.w2.weight", + "shape": [ + 6144, + 16384 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 201326592, + "byteOffset": 0 + } + ], + "md5sum": "5e6ad79422b84ab6817e84ce1eae9142" + }, + { + "dataPath": "params_shard_4.bin", + "format": "raw-shard", + "nbytes": 1137180672, + "records": [ + { + "name": "model.tok_embeddings.weight", + "shape": [ + 92544, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1137180672, + "byteOffset": 0 + } + ], + "md5sum": "c2c0dcdaa5fb65dc27c3af77f4be9222" + }, + { + "dataPath": "params_shard_5.bin", + "format": "raw-shard", + "nbytes": 75497472, + "records": [ + { + "name": "model.layers.1.attention.wo.weight", + "shape": [ + 6144, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 75497472, + "byteOffset": 0 + } + ], + "md5sum": "6a67d00fca1fb44ec6c145f25edcf09d" + }, + { + "dataPath": "params_shard_6.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.1.attention.wqkv.weight", + "shape": [ + 8192, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "0f3bce60bc68c6b0486ab25e032f1bef" + }, + { + "dataPath": "params_shard_7.bin", + "format": "raw-shard", + "nbytes": 402653184, + "records": [ + { + "name": "model.layers.1.feed_forward.gate_up_proj.weight", + "shape": [ + 32768, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 402653184, + "byteOffset": 0 + } + ], + "md5sum": "a56910c6a122b400b1b78632935484e4" + }, + { + "dataPath": "params_shard_8.bin", + "format": "raw-shard", + "nbytes": 201326592, + "records": [ + { + "name": "model.layers.1.feed_forward.w2.weight", + "shape": [ + 6144, + 16384 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 201326592, + "byteOffset": 0 + } + ], + "md5sum": "a78aaa58397280571207a00af537581c" + }, + { + "dataPath": "params_shard_9.bin", + "format": "raw-shard", + "nbytes": 75497472, + "records": [ + { + "name": "model.layers.2.attention.wo.weight", + "shape": [ + 6144, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 75497472, + "byteOffset": 0 + } + ], + "md5sum": "cbbc42abfea33905e066e923b4fa5615" + }, + { + "dataPath": "params_shard_10.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.2.attention.wqkv.weight", + "shape": [ + 8192, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "3fb14b1507ee68a3cb2da640bf5f1621" + }, + { + "dataPath": "params_shard_11.bin", + "format": "raw-shard", + "nbytes": 402653184, + "records": [ + { + "name": "model.layers.2.feed_forward.gate_up_proj.weight", + "shape": [ + 32768, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 402653184, + "byteOffset": 0 + } + ], + "md5sum": "0c3060a8a29e05e7fee9983220c66142" + }, + { + "dataPath": "params_shard_12.bin", + "format": "raw-shard", + "nbytes": 201326592, + "records": [ + { + "name": "model.layers.2.feed_forward.w2.weight", + "shape": [ + 6144, + 16384 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 201326592, + "byteOffset": 0 + } + ], + "md5sum": "7565e5436c7cebbe2d0da90a2d314ee7" + }, + { + "dataPath": "params_shard_13.bin", + "format": "raw-shard", + "nbytes": 75497472, + "records": [ + { + "name": "model.layers.3.attention.wo.weight", + "shape": [ + 6144, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 75497472, + "byteOffset": 0 + } + ], + "md5sum": "0df3bec71638aad48c3f6fdf43250582" + }, + { + "dataPath": "params_shard_14.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.3.attention.wqkv.weight", + "shape": [ + 8192, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "cded647762891145b4f2708cfb0219ce" + }, + { + "dataPath": "params_shard_15.bin", + "format": "raw-shard", + "nbytes": 402653184, + "records": [ + { + "name": "model.layers.3.feed_forward.gate_up_proj.weight", + "shape": [ + 32768, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 402653184, + "byteOffset": 0 + } + ], + "md5sum": "6c0da8fb8b983d34d16a700a4b026219" + }, + { + "dataPath": "params_shard_16.bin", + "format": "raw-shard", + "nbytes": 75497472, + "records": [ + { + "name": "model.layers.10.attention.wo.weight", + "shape": [ + 6144, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 75497472, + "byteOffset": 0 + } + ], + "md5sum": "3aa943f7c89f892a6ff2cc6c5dcf97bd" + }, + { + "dataPath": "params_shard_17.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.10.attention.wqkv.weight", + "shape": [ + 8192, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "ef650d89e9f5561640e879d433eb9291" + }, + { + "dataPath": "params_shard_18.bin", + "format": "raw-shard", + "nbytes": 402653184, + "records": [ + { + "name": "model.layers.10.feed_forward.gate_up_proj.weight", + "shape": [ + 32768, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 402653184, + "byteOffset": 0 + } + ], + "md5sum": "a59efb340313927ff568bb83d6189269" + }, + { + "dataPath": "params_shard_19.bin", + "format": "raw-shard", + "nbytes": 201326592, + "records": [ + { + "name": "model.layers.10.feed_forward.w2.weight", + "shape": [ + 6144, + 16384 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 201326592, + "byteOffset": 0 + } + ], + "md5sum": "140bc29d20ec55db204d76c7757910d8" + }, + { + "dataPath": "params_shard_20.bin", + "format": "raw-shard", + "nbytes": 201326592, + "records": [ + { + "name": "model.layers.8.feed_forward.w2.weight", + "shape": [ + 6144, + 16384 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 201326592, + "byteOffset": 0 + } + ], + "md5sum": "a45245fb0d0dcfadfca2ebb59d27b11f" + }, + { + "dataPath": "params_shard_21.bin", + "format": "raw-shard", + "nbytes": 402653184, + "records": [ + { + "name": "model.layers.8.feed_forward.gate_up_proj.weight", + "shape": [ + 32768, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 402653184, + "byteOffset": 0 + } + ], + "md5sum": "6089e29b51b9445b391472dba762a4ae" + }, + { + "dataPath": "params_shard_22.bin", + "format": "raw-shard", + "nbytes": 75497472, + "records": [ + { + "name": "model.layers.9.attention.wo.weight", + "shape": [ + 6144, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 75497472, + "byteOffset": 0 + } + ], + "md5sum": "67f22370f2e77097c0dd66e71dbed781" + }, + { + "dataPath": "params_shard_23.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.9.attention.wqkv.weight", + "shape": [ + 8192, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "d0f49513aa0a3a998616d7fac6c31783" + }, + { + "dataPath": "params_shard_24.bin", + "format": "raw-shard", + "nbytes": 402653184, + "records": [ + { + "name": "model.layers.9.feed_forward.gate_up_proj.weight", + "shape": [ + 32768, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 402653184, + "byteOffset": 0 + } + ], + "md5sum": "7f875669b4b20e1a195b3d6fe124b54e" + }, + { + "dataPath": "params_shard_25.bin", + "format": "raw-shard", + "nbytes": 201326592, + "records": [ + { + "name": "model.layers.9.feed_forward.w2.weight", + "shape": [ + 6144, + 16384 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 201326592, + "byteOffset": 0 + } + ], + "md5sum": "b2abe5a96278a3aa700575d7c3974913" + }, + { + "dataPath": "params_shard_26.bin", + "format": "raw-shard", + "nbytes": 75497472, + "records": [ + { + "name": "model.layers.11.attention.wo.weight", + "shape": [ + 6144, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 75497472, + "byteOffset": 0 + } + ], + "md5sum": "115da155e91aedc832328763ea5fe0db" + }, + { + "dataPath": "params_shard_27.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.11.attention.wqkv.weight", + "shape": [ + 8192, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "0f7ebef9ec340a3a76111f828a655fbf" + }, + { + "dataPath": "params_shard_28.bin", + "format": "raw-shard", + "nbytes": 402653184, + "records": [ + { + "name": "model.layers.11.feed_forward.gate_up_proj.weight", + "shape": [ + 32768, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 402653184, + "byteOffset": 0 + } + ], + "md5sum": "2f98db679b023feef88e6e6161ca559e" + }, + { + "dataPath": "params_shard_29.bin", + "format": "raw-shard", + "nbytes": 201326592, + "records": [ + { + "name": "model.layers.11.feed_forward.w2.weight", + "shape": [ + 6144, + 16384 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 201326592, + "byteOffset": 0 + } + ], + "md5sum": "91c1e7ace4cc6d5a811ffbe9e2091b82" + }, + { + "dataPath": "params_shard_30.bin", + "format": "raw-shard", + "nbytes": 75497472, + "records": [ + { + "name": "model.layers.12.attention.wo.weight", + "shape": [ + 6144, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 75497472, + "byteOffset": 0 + } + ], + "md5sum": "0c127b17b7f497e819bfad9366395efd" + }, + { + "dataPath": "params_shard_31.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.12.attention.wqkv.weight", + "shape": [ + 8192, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "3c8bbddb85a8a60221b60a36392dae0e" + }, + { + "dataPath": "params_shard_32.bin", + "format": "raw-shard", + "nbytes": 402653184, + "records": [ + { + "name": "model.layers.12.feed_forward.gate_up_proj.weight", + "shape": [ + 32768, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 402653184, + "byteOffset": 0 + } + ], + "md5sum": "65e865d0402bd45bf47bdc53124ca7ab" + }, + { + "dataPath": "params_shard_33.bin", + "format": "raw-shard", + "nbytes": 201326592, + "records": [ + { + "name": "model.layers.12.feed_forward.w2.weight", + "shape": [ + 6144, + 16384 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 201326592, + "byteOffset": 0 + } + ], + "md5sum": "f72453e64e6b45746f737ba3e873ad8f" + }, + { + "dataPath": "params_shard_34.bin", + "format": "raw-shard", + "nbytes": 75497472, + "records": [ + { + "name": "model.layers.13.attention.wo.weight", + "shape": [ + 6144, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 75497472, + "byteOffset": 0 + } + ], + "md5sum": "bf8df85329a7581d062da7a3c49cea76" + }, + { + "dataPath": "params_shard_35.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.13.attention.wqkv.weight", + "shape": [ + 8192, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "f4607212cc716ca83ed380c0b7d8226d" + }, + { + "dataPath": "params_shard_36.bin", + "format": "raw-shard", + "nbytes": 402653184, + "records": [ + { + "name": "model.layers.13.feed_forward.gate_up_proj.weight", + "shape": [ + 32768, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 402653184, + "byteOffset": 0 + } + ], + "md5sum": "33e947cea8860a6d7ca378a3c7e8f47f" + }, + { + "dataPath": "params_shard_37.bin", + "format": "raw-shard", + "nbytes": 201326592, + "records": [ + { + "name": "model.layers.13.feed_forward.w2.weight", + "shape": [ + 6144, + 16384 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 201326592, + "byteOffset": 0 + } + ], + "md5sum": "2d2fbaa70fe5504c6893bb00bd341b15" + }, + { + "dataPath": "params_shard_38.bin", + "format": "raw-shard", + "nbytes": 75497472, + "records": [ + { + "name": "model.layers.14.attention.wo.weight", + "shape": [ + 6144, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 75497472, + "byteOffset": 0 + } + ], + "md5sum": "58a7fae456e781a6349d68341fd472e7" + }, + { + "dataPath": "params_shard_39.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.14.attention.wqkv.weight", + "shape": [ + 8192, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "aad5026e5d5235e5095116244220c107" + }, + { + "dataPath": "params_shard_40.bin", + "format": "raw-shard", + "nbytes": 402653184, + "records": [ + { + "name": "model.layers.14.feed_forward.gate_up_proj.weight", + "shape": [ + 32768, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 402653184, + "byteOffset": 0 + } + ], + "md5sum": "f2bd511d42a447d508b23d9fc00cb071" + }, + { + "dataPath": "params_shard_41.bin", + "format": "raw-shard", + "nbytes": 201326592, + "records": [ + { + "name": "model.layers.14.feed_forward.w2.weight", + "shape": [ + 6144, + 16384 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 201326592, + "byteOffset": 0 + } + ], + "md5sum": "79364dac6fa081b3497ed2a0f9899321" + }, + { + "dataPath": "params_shard_42.bin", + "format": "raw-shard", + "nbytes": 75497472, + "records": [ + { + "name": "model.layers.15.attention.wo.weight", + "shape": [ + 6144, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 75497472, + "byteOffset": 0 + } + ], + "md5sum": "376f15535d3f62aa3f0b6891546d6118" + }, + { + "dataPath": "params_shard_43.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.15.attention.wqkv.weight", + "shape": [ + 8192, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "2c414d31013d54a7372866bff2a3e905" + }, + { + "dataPath": "params_shard_44.bin", + "format": "raw-shard", + "nbytes": 402653184, + "records": [ + { + "name": "model.layers.15.feed_forward.gate_up_proj.weight", + "shape": [ + 32768, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 402653184, + "byteOffset": 0 + } + ], + "md5sum": "7c41335c011514c3c6e3b6fc998f1dc7" + }, + { + "dataPath": "params_shard_45.bin", + "format": "raw-shard", + "nbytes": 201326592, + "records": [ + { + "name": "model.layers.15.feed_forward.w2.weight", + "shape": [ + 6144, + 16384 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 201326592, + "byteOffset": 0 + } + ], + "md5sum": "8a450e3c401107275f5d32c1234b6aa8" + }, + { + "dataPath": "params_shard_46.bin", + "format": "raw-shard", + "nbytes": 75497472, + "records": [ + { + "name": "model.layers.16.attention.wo.weight", + "shape": [ + 6144, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 75497472, + "byteOffset": 0 + } + ], + "md5sum": "deadbfc6d8875d5e6cdad4cefa3685fb" + }, + { + "dataPath": "params_shard_47.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.16.attention.wqkv.weight", + "shape": [ + 8192, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "cbb9e3961a34277734f849e45866714a" + }, + { + "dataPath": "params_shard_48.bin", + "format": "raw-shard", + "nbytes": 402653184, + "records": [ + { + "name": "model.layers.16.feed_forward.gate_up_proj.weight", + "shape": [ + 32768, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 402653184, + "byteOffset": 0 + } + ], + "md5sum": "f5a4ce98c5d2e52493925a19c7654adf" + }, + { + "dataPath": "params_shard_49.bin", + "format": "raw-shard", + "nbytes": 201326592, + "records": [ + { + "name": "model.layers.16.feed_forward.w2.weight", + "shape": [ + 6144, + 16384 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 201326592, + "byteOffset": 0 + } + ], + "md5sum": "442cb65ef56d6751250fec205f32206d" + }, + { + "dataPath": "params_shard_50.bin", + "format": "raw-shard", + "nbytes": 75497472, + "records": [ + { + "name": "model.layers.17.attention.wo.weight", + "shape": [ + 6144, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 75497472, + "byteOffset": 0 + } + ], + "md5sum": "996c44fc4a143c6d313a6c1ab33751db" + }, + { + "dataPath": "params_shard_51.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.17.attention.wqkv.weight", + "shape": [ + 8192, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "03f8715bb6374a621fcc498bddafdca1" + }, + { + "dataPath": "params_shard_52.bin", + "format": "raw-shard", + "nbytes": 402653184, + "records": [ + { + "name": "model.layers.17.feed_forward.gate_up_proj.weight", + "shape": [ + 32768, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 402653184, + "byteOffset": 0 + } + ], + "md5sum": "d00a5c827c10b9efd8b963c56db13cea" + }, + { + "dataPath": "params_shard_53.bin", + "format": "raw-shard", + "nbytes": 201326592, + "records": [ + { + "name": "model.layers.17.feed_forward.w2.weight", + "shape": [ + 6144, + 16384 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 201326592, + "byteOffset": 0 + } + ], + "md5sum": "1117c3033d8d3ac0b0d5a30ab12fefb6" + }, + { + "dataPath": "params_shard_54.bin", + "format": "raw-shard", + "nbytes": 75497472, + "records": [ + { + "name": "model.layers.18.attention.wo.weight", + "shape": [ + 6144, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 75497472, + "byteOffset": 0 + } + ], + "md5sum": "39fb853910df32a025a6eb9ca4a25473" + }, + { + "dataPath": "params_shard_55.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.18.attention.wqkv.weight", + "shape": [ + 8192, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "34904a27391a85623384e5da29c38e60" + }, + { + "dataPath": "params_shard_56.bin", + "format": "raw-shard", + "nbytes": 402653184, + "records": [ + { + "name": "model.layers.18.feed_forward.gate_up_proj.weight", + "shape": [ + 32768, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 402653184, + "byteOffset": 0 + } + ], + "md5sum": "2a3eaef32fc92ccb6871327c8b875f5c" + }, + { + "dataPath": "params_shard_57.bin", + "format": "raw-shard", + "nbytes": 201326592, + "records": [ + { + "name": "model.layers.18.feed_forward.w2.weight", + "shape": [ + 6144, + 16384 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 201326592, + "byteOffset": 0 + } + ], + "md5sum": "63e9e39b6cff6bc320e6cea70ba69639" + }, + { + "dataPath": "params_shard_58.bin", + "format": "raw-shard", + "nbytes": 75497472, + "records": [ + { + "name": "model.layers.19.attention.wo.weight", + "shape": [ + 6144, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 75497472, + "byteOffset": 0 + } + ], + "md5sum": "a0b4ba9b944d8dbf07da9c0d087c1ba4" + }, + { + "dataPath": "params_shard_59.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.19.attention.wqkv.weight", + "shape": [ + 8192, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "103771179c443ce4f4e28e7e06aebb20" + }, + { + "dataPath": "params_shard_60.bin", + "format": "raw-shard", + "nbytes": 402653184, + "records": [ + { + "name": "model.layers.19.feed_forward.gate_up_proj.weight", + "shape": [ + 32768, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 402653184, + "byteOffset": 0 + } + ], + "md5sum": "7e687c9999b496d0009fd5635a48f33d" + }, + { + "dataPath": "params_shard_61.bin", + "format": "raw-shard", + "nbytes": 201326592, + "records": [ + { + "name": "model.layers.19.feed_forward.w2.weight", + "shape": [ + 6144, + 16384 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 201326592, + "byteOffset": 0 + } + ], + "md5sum": "fc458af151395e439cac311eba2227bc" + }, + { + "dataPath": "params_shard_62.bin", + "format": "raw-shard", + "nbytes": 75497472, + "records": [ + { + "name": "model.layers.20.attention.wo.weight", + "shape": [ + 6144, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 75497472, + "byteOffset": 0 + } + ], + "md5sum": "4b75a822656f9d5ef019b4aebbb86568" + }, + { + "dataPath": "params_shard_63.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.20.attention.wqkv.weight", + "shape": [ + 8192, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "72d2fe17844cf036d734bd591202e73f" + }, + { + "dataPath": "params_shard_64.bin", + "format": "raw-shard", + "nbytes": 402653184, + "records": [ + { + "name": "model.layers.20.feed_forward.gate_up_proj.weight", + "shape": [ + 32768, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 402653184, + "byteOffset": 0 + } + ], + "md5sum": "0b3cebdf40ae164954edabaed15831b0" + }, + { + "dataPath": "params_shard_65.bin", + "format": "raw-shard", + "nbytes": 201326592, + "records": [ + { + "name": "model.layers.20.feed_forward.w2.weight", + "shape": [ + 6144, + 16384 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 201326592, + "byteOffset": 0 + } + ], + "md5sum": "7fc53cdd069a070f875ea52d2f34a00d" + }, + { + "dataPath": "params_shard_66.bin", + "format": "raw-shard", + "nbytes": 75497472, + "records": [ + { + "name": "model.layers.21.attention.wo.weight", + "shape": [ + 6144, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 75497472, + "byteOffset": 0 + } + ], + "md5sum": "22e5b73efc709a50a55bee29ac9057df" + }, + { + "dataPath": "params_shard_67.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.21.attention.wqkv.weight", + "shape": [ + 8192, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "4ce4eba3c2fe8fbebc02a092edecdd7f" + }, + { + "dataPath": "params_shard_68.bin", + "format": "raw-shard", + "nbytes": 402653184, + "records": [ + { + "name": "model.layers.21.feed_forward.gate_up_proj.weight", + "shape": [ + 32768, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 402653184, + "byteOffset": 0 + } + ], + "md5sum": "de936b13fa07faeca154116205e9d2eb" + }, + { + "dataPath": "params_shard_69.bin", + "format": "raw-shard", + "nbytes": 201326592, + "records": [ + { + "name": "model.layers.21.feed_forward.w2.weight", + "shape": [ + 6144, + 16384 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 201326592, + "byteOffset": 0 + } + ], + "md5sum": "7804e21972af4a0a98c4942116e28b6a" + }, + { + "dataPath": "params_shard_70.bin", + "format": "raw-shard", + "nbytes": 75497472, + "records": [ + { + "name": "model.layers.22.attention.wo.weight", + "shape": [ + 6144, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 75497472, + "byteOffset": 0 + } + ], + "md5sum": "5fce8a96d1bf435bd8dc33611ddbf449" + }, + { + "dataPath": "params_shard_71.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.22.attention.wqkv.weight", + "shape": [ + 8192, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "0fc9ce7067c18cf479452ef08dcecb3b" + }, + { + "dataPath": "params_shard_72.bin", + "format": "raw-shard", + "nbytes": 402653184, + "records": [ + { + "name": "model.layers.22.feed_forward.gate_up_proj.weight", + "shape": [ + 32768, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 402653184, + "byteOffset": 0 + } + ], + "md5sum": "4271a3890431078cc5ec4be13cb273f1" + }, + { + "dataPath": "params_shard_73.bin", + "format": "raw-shard", + "nbytes": 201326592, + "records": [ + { + "name": "model.layers.22.feed_forward.w2.weight", + "shape": [ + 6144, + 16384 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 201326592, + "byteOffset": 0 + } + ], + "md5sum": "d03f2f509167fa77b85e331257422ba9" + }, + { + "dataPath": "params_shard_74.bin", + "format": "raw-shard", + "nbytes": 75497472, + "records": [ + { + "name": "model.layers.23.attention.wo.weight", + "shape": [ + 6144, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 75497472, + "byteOffset": 0 + } + ], + "md5sum": "f026f30b4b7f1fcccaf64e6aaf938462" + }, + { + "dataPath": "params_shard_75.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.23.attention.wqkv.weight", + "shape": [ + 8192, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "66d19ca9fee7430684548cce174d4e13" + }, + { + "dataPath": "params_shard_76.bin", + "format": "raw-shard", + "nbytes": 402653184, + "records": [ + { + "name": "model.layers.23.feed_forward.gate_up_proj.weight", + "shape": [ + 32768, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 402653184, + "byteOffset": 0 + } + ], + "md5sum": "69a9e86d60c5ba00ff45ccf02794b67b" + }, + { + "dataPath": "params_shard_77.bin", + "format": "raw-shard", + "nbytes": 201326592, + "records": [ + { + "name": "model.layers.23.feed_forward.w2.weight", + "shape": [ + 6144, + 16384 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 201326592, + "byteOffset": 0 + } + ], + "md5sum": "167de8311549bc8da52b1682e5bd7b44" + }, + { + "dataPath": "params_shard_78.bin", + "format": "raw-shard", + "nbytes": 75497472, + "records": [ + { + "name": "model.layers.24.attention.wo.weight", + "shape": [ + 6144, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 75497472, + "byteOffset": 0 + } + ], + "md5sum": "779d094bb1c6cce6debfa64b638f5e61" + }, + { + "dataPath": "params_shard_79.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.24.attention.wqkv.weight", + "shape": [ + 8192, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "3ea567219c3af38665ed09b6d1b16e2d" + }, + { + "dataPath": "params_shard_80.bin", + "format": "raw-shard", + "nbytes": 402653184, + "records": [ + { + "name": "model.layers.24.feed_forward.gate_up_proj.weight", + "shape": [ + 32768, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 402653184, + "byteOffset": 0 + } + ], + "md5sum": "2296ab0d0df0cc8d1a4bd3a8a5e06f4c" + }, + { + "dataPath": "params_shard_81.bin", + "format": "raw-shard", + "nbytes": 201326592, + "records": [ + { + "name": "model.layers.24.feed_forward.w2.weight", + "shape": [ + 6144, + 16384 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 201326592, + "byteOffset": 0 + } + ], + "md5sum": "aa990ed8557bc5a8e003486d56f4e187" + }, + { + "dataPath": "params_shard_82.bin", + "format": "raw-shard", + "nbytes": 75497472, + "records": [ + { + "name": "model.layers.25.attention.wo.weight", + "shape": [ + 6144, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 75497472, + "byteOffset": 0 + } + ], + "md5sum": "58b0ca9f82716be7e75b4fb7455b1e0f" + }, + { + "dataPath": "params_shard_83.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.25.attention.wqkv.weight", + "shape": [ + 8192, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "0c0aebabe5bacb9624c63a0c6a2a4982" + }, + { + "dataPath": "params_shard_84.bin", + "format": "raw-shard", + "nbytes": 402653184, + "records": [ + { + "name": "model.layers.25.feed_forward.gate_up_proj.weight", + "shape": [ + 32768, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 402653184, + "byteOffset": 0 + } + ], + "md5sum": "ae149d0cbec934811f4fd3a4d28ae2fd" + }, + { + "dataPath": "params_shard_85.bin", + "format": "raw-shard", + "nbytes": 201326592, + "records": [ + { + "name": "model.layers.25.feed_forward.w2.weight", + "shape": [ + 6144, + 16384 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 201326592, + "byteOffset": 0 + } + ], + "md5sum": "35390a0c485b710883f77d26dc145867" + }, + { + "dataPath": "params_shard_86.bin", + "format": "raw-shard", + "nbytes": 75497472, + "records": [ + { + "name": "model.layers.26.attention.wo.weight", + "shape": [ + 6144, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 75497472, + "byteOffset": 0 + } + ], + "md5sum": "abe647676c59ff8962a8c57567ddd83a" + }, + { + "dataPath": "params_shard_87.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.26.attention.wqkv.weight", + "shape": [ + 8192, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "234c054cc614010c6798441f9f33617b" + }, + { + "dataPath": "params_shard_88.bin", + "format": "raw-shard", + "nbytes": 402653184, + "records": [ + { + "name": "model.layers.26.feed_forward.gate_up_proj.weight", + "shape": [ + 32768, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 402653184, + "byteOffset": 0 + } + ], + "md5sum": "dbbab3c909bc282209abe32d6f29820b" + }, + { + "dataPath": "params_shard_89.bin", + "format": "raw-shard", + "nbytes": 201326592, + "records": [ + { + "name": "model.layers.26.feed_forward.w2.weight", + "shape": [ + 6144, + 16384 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 201326592, + "byteOffset": 0 + } + ], + "md5sum": "43bca02513e73101ecc185d9e9efa6b5" + }, + { + "dataPath": "params_shard_90.bin", + "format": "raw-shard", + "nbytes": 75497472, + "records": [ + { + "name": "model.layers.27.attention.wo.weight", + "shape": [ + 6144, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 75497472, + "byteOffset": 0 + } + ], + "md5sum": "95e85002434e9c1d8695f865ce51ebdb" + }, + { + "dataPath": "params_shard_91.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.27.attention.wqkv.weight", + "shape": [ + 8192, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "ed986c68569f42b1c0d0dc3f4ed884c5" + }, + { + "dataPath": "params_shard_92.bin", + "format": "raw-shard", + "nbytes": 402653184, + "records": [ + { + "name": "model.layers.27.feed_forward.gate_up_proj.weight", + "shape": [ + 32768, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 402653184, + "byteOffset": 0 + } + ], + "md5sum": "64bf6132b570a610b7247f680862f2b0" + }, + { + "dataPath": "params_shard_93.bin", + "format": "raw-shard", + "nbytes": 201326592, + "records": [ + { + "name": "model.layers.27.feed_forward.w2.weight", + "shape": [ + 6144, + 16384 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 201326592, + "byteOffset": 0 + } + ], + "md5sum": "97257a4bf41f98824cd5c30a4fa53073" + }, + { + "dataPath": "params_shard_94.bin", + "format": "raw-shard", + "nbytes": 75497472, + "records": [ + { + "name": "model.layers.28.attention.wo.weight", + "shape": [ + 6144, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 75497472, + "byteOffset": 0 + } + ], + "md5sum": "394ed581bc5d2e2998d06a4c3a028b33" + }, + { + "dataPath": "params_shard_95.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.28.attention.wqkv.weight", + "shape": [ + 8192, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "96899c819298dbdeb12c7789383ed44d" + }, + { + "dataPath": "params_shard_96.bin", + "format": "raw-shard", + "nbytes": 402653184, + "records": [ + { + "name": "model.layers.28.feed_forward.gate_up_proj.weight", + "shape": [ + 32768, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 402653184, + "byteOffset": 0 + } + ], + "md5sum": "5bf4c2b3bf9c19b599d4d9c3bba6d73c" + }, + { + "dataPath": "params_shard_97.bin", + "format": "raw-shard", + "nbytes": 201326592, + "records": [ + { + "name": "model.layers.28.feed_forward.w2.weight", + "shape": [ + 6144, + 16384 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 201326592, + "byteOffset": 0 + } + ], + "md5sum": "c1b9e2eda5bf8720513b8c8f65bd943a" + }, + { + "dataPath": "params_shard_98.bin", + "format": "raw-shard", + "nbytes": 75497472, + "records": [ + { + "name": "model.layers.29.attention.wo.weight", + "shape": [ + 6144, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 75497472, + "byteOffset": 0 + } + ], + "md5sum": "c0a1708ab31208cdd0c6d5363d6d8093" + }, + { + "dataPath": "params_shard_99.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.29.attention.wqkv.weight", + "shape": [ + 8192, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "838bd986ce2b844f216547d20c13b95e" + }, + { + "dataPath": "params_shard_100.bin", + "format": "raw-shard", + "nbytes": 402653184, + "records": [ + { + "name": "model.layers.29.feed_forward.gate_up_proj.weight", + "shape": [ + 32768, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 402653184, + "byteOffset": 0 + } + ], + "md5sum": "755c0156a106a48c4f09b4d20db1b948" + }, + { + "dataPath": "params_shard_101.bin", + "format": "raw-shard", + "nbytes": 201326592, + "records": [ + { + "name": "model.layers.29.feed_forward.w2.weight", + "shape": [ + 6144, + 16384 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 201326592, + "byteOffset": 0 + } + ], + "md5sum": "f425cc44a1efd94696cc7e9de4ca49c4" + }, + { + "dataPath": "params_shard_102.bin", + "format": "raw-shard", + "nbytes": 75497472, + "records": [ + { + "name": "model.layers.30.attention.wo.weight", + "shape": [ + 6144, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 75497472, + "byteOffset": 0 + } + ], + "md5sum": "9386cb4e7eb3d5ee5a979bb7ac401c14" + }, + { + "dataPath": "params_shard_103.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.30.attention.wqkv.weight", + "shape": [ + 8192, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "86a6705a6e9371f902e0be4c636bc4a5" + }, + { + "dataPath": "params_shard_104.bin", + "format": "raw-shard", + "nbytes": 402653184, + "records": [ + { + "name": "model.layers.30.feed_forward.gate_up_proj.weight", + "shape": [ + 32768, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 402653184, + "byteOffset": 0 + } + ], + "md5sum": "ddf2fad7986595d974215da056b5fbf8" + }, + { + "dataPath": "params_shard_105.bin", + "format": "raw-shard", + "nbytes": 201326592, + "records": [ + { + "name": "model.layers.30.feed_forward.w2.weight", + "shape": [ + 6144, + 16384 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 201326592, + "byteOffset": 0 + } + ], + "md5sum": "df3f83c9f0b140cade318c7935ecfae6" + }, + { + "dataPath": "params_shard_106.bin", + "format": "raw-shard", + "nbytes": 201326592, + "records": [ + { + "name": "model.layers.3.feed_forward.w2.weight", + "shape": [ + 6144, + 16384 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 201326592, + "byteOffset": 0 + } + ], + "md5sum": "1afed988133967734c5b986e67fa77f9" + }, + { + "dataPath": "params_shard_107.bin", + "format": "raw-shard", + "nbytes": 75497472, + "records": [ + { + "name": "model.layers.4.attention.wo.weight", + "shape": [ + 6144, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 75497472, + "byteOffset": 0 + } + ], + "md5sum": "208154e4e96d7b69943d25dbaea017e0" + }, + { + "dataPath": "params_shard_108.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.4.attention.wqkv.weight", + "shape": [ + 8192, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "e93ef785e28cd634b7c9fa27a2302e89" + }, + { + "dataPath": "params_shard_109.bin", + "format": "raw-shard", + "nbytes": 402653184, + "records": [ + { + "name": "model.layers.4.feed_forward.gate_up_proj.weight", + "shape": [ + 32768, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 402653184, + "byteOffset": 0 + } + ], + "md5sum": "dbb3f9f1c03e11b8979f5e5c71b97161" + }, + { + "dataPath": "params_shard_110.bin", + "format": "raw-shard", + "nbytes": 201326592, + "records": [ + { + "name": "model.layers.4.feed_forward.w2.weight", + "shape": [ + 6144, + 16384 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 201326592, + "byteOffset": 0 + } + ], + "md5sum": "b2047ed1a305ce22e9033c3087ea6dd1" + }, + { + "dataPath": "params_shard_111.bin", + "format": "raw-shard", + "nbytes": 75497472, + "records": [ + { + "name": "model.layers.5.attention.wo.weight", + "shape": [ + 6144, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 75497472, + "byteOffset": 0 + } + ], + "md5sum": "9e4f4bbbd333758f10304c222b059adf" + }, + { + "dataPath": "params_shard_112.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.5.attention.wqkv.weight", + "shape": [ + 8192, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "621902bde2f85d5f7b769d9edec80627" + }, + { + "dataPath": "params_shard_113.bin", + "format": "raw-shard", + "nbytes": 402653184, + "records": [ + { + "name": "model.layers.5.feed_forward.gate_up_proj.weight", + "shape": [ + 32768, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 402653184, + "byteOffset": 0 + } + ], + "md5sum": "bd0ff996707fdbd4014b85e59a9902a7" + }, + { + "dataPath": "params_shard_114.bin", + "format": "raw-shard", + "nbytes": 201326592, + "records": [ + { + "name": "model.layers.5.feed_forward.w2.weight", + "shape": [ + 6144, + 16384 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 201326592, + "byteOffset": 0 + } + ], + "md5sum": "4e26cb8217bba4d5146f3e379bc16a5a" + }, + { + "dataPath": "params_shard_115.bin", + "format": "raw-shard", + "nbytes": 75497472, + "records": [ + { + "name": "model.layers.31.attention.wo.weight", + "shape": [ + 6144, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 75497472, + "byteOffset": 0 + } + ], + "md5sum": "a7c7b64f3dfa86ce363887dbb9cd513e" + }, + { + "dataPath": "params_shard_116.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.31.attention.wqkv.weight", + "shape": [ + 8192, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "ad296d6a68401a33255105f1357b42b5" + }, + { + "dataPath": "params_shard_117.bin", + "format": "raw-shard", + "nbytes": 402653184, + "records": [ + { + "name": "model.layers.31.feed_forward.gate_up_proj.weight", + "shape": [ + 32768, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 402653184, + "byteOffset": 0 + } + ], + "md5sum": "c5f0790a4f97440bd213fb188a3af04b" + }, + { + "dataPath": "params_shard_118.bin", + "format": "raw-shard", + "nbytes": 201326592, + "records": [ + { + "name": "model.layers.31.feed_forward.w2.weight", + "shape": [ + 6144, + 16384 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 201326592, + "byteOffset": 0 + } + ], + "md5sum": "bb56c06177c45c5bd2918981fa0cc481" + }, + { + "dataPath": "params_shard_119.bin", + "format": "raw-shard", + "nbytes": 75497472, + "records": [ + { + "name": "model.layers.32.attention.wo.weight", + "shape": [ + 6144, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 75497472, + "byteOffset": 0 + } + ], + "md5sum": "08b57ff23c3674814561cede73380547" + }, + { + "dataPath": "params_shard_120.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.32.attention.wqkv.weight", + "shape": [ + 8192, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "e58867d7ac6d2ec5c9b4ebea874cef29" + }, + { + "dataPath": "params_shard_121.bin", + "format": "raw-shard", + "nbytes": 402653184, + "records": [ + { + "name": "model.layers.32.feed_forward.gate_up_proj.weight", + "shape": [ + 32768, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 402653184, + "byteOffset": 0 + } + ], + "md5sum": "df1b606f74f2f5be355a3520e19772dd" + }, + { + "dataPath": "params_shard_122.bin", + "format": "raw-shard", + "nbytes": 201326592, + "records": [ + { + "name": "model.layers.32.feed_forward.w2.weight", + "shape": [ + 6144, + 16384 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 201326592, + "byteOffset": 0 + } + ], + "md5sum": "f1efc78efe9c02501a66cfb689cf6a3c" + }, + { + "dataPath": "params_shard_123.bin", + "format": "raw-shard", + "nbytes": 75497472, + "records": [ + { + "name": "model.layers.33.attention.wo.weight", + "shape": [ + 6144, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 75497472, + "byteOffset": 0 + } + ], + "md5sum": "5da48a915e2929f04ec1396efecb0c11" + }, + { + "dataPath": "params_shard_124.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.33.attention.wqkv.weight", + "shape": [ + 8192, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "d4d9c37a234cd8036d9ea0017d411ffe" + }, + { + "dataPath": "params_shard_125.bin", + "format": "raw-shard", + "nbytes": 402653184, + "records": [ + { + "name": "model.layers.33.feed_forward.gate_up_proj.weight", + "shape": [ + 32768, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 402653184, + "byteOffset": 0 + } + ], + "md5sum": "af43da9fdb44e7935315c9cb21836bd0" + }, + { + "dataPath": "params_shard_126.bin", + "format": "raw-shard", + "nbytes": 201326592, + "records": [ + { + "name": "model.layers.33.feed_forward.w2.weight", + "shape": [ + 6144, + 16384 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 201326592, + "byteOffset": 0 + } + ], + "md5sum": "c4d0cb7fb30a658097c55565769664a4" + }, + { + "dataPath": "params_shard_127.bin", + "format": "raw-shard", + "nbytes": 75497472, + "records": [ + { + "name": "model.layers.34.attention.wo.weight", + "shape": [ + 6144, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 75497472, + "byteOffset": 0 + } + ], + "md5sum": "f469789ef1e085ab677689b7a1676fbe" + }, + { + "dataPath": "params_shard_128.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.34.attention.wqkv.weight", + "shape": [ + 8192, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "9a0a4f84967d2300b4e53f2e756729e0" + }, + { + "dataPath": "params_shard_129.bin", + "format": "raw-shard", + "nbytes": 402653184, + "records": [ + { + "name": "model.layers.34.feed_forward.gate_up_proj.weight", + "shape": [ + 32768, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 402653184, + "byteOffset": 0 + } + ], + "md5sum": "10365a52603934a5d50603ff4330703a" + }, + { + "dataPath": "params_shard_130.bin", + "format": "raw-shard", + "nbytes": 201326592, + "records": [ + { + "name": "model.layers.34.feed_forward.w2.weight", + "shape": [ + 6144, + 16384 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 201326592, + "byteOffset": 0 + } + ], + "md5sum": "b8029e5306d1592191b2723a18600d45" + }, + { + "dataPath": "params_shard_131.bin", + "format": "raw-shard", + "nbytes": 75497472, + "records": [ + { + "name": "model.layers.35.attention.wo.weight", + "shape": [ + 6144, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 75497472, + "byteOffset": 0 + } + ], + "md5sum": "7556d983866e211fa47eb789514fb419" + }, + { + "dataPath": "params_shard_132.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.35.attention.wqkv.weight", + "shape": [ + 8192, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "55d01740e75910478c7f74ec12a03d91" + }, + { + "dataPath": "params_shard_133.bin", + "format": "raw-shard", + "nbytes": 402653184, + "records": [ + { + "name": "model.layers.35.feed_forward.gate_up_proj.weight", + "shape": [ + 32768, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 402653184, + "byteOffset": 0 + } + ], + "md5sum": "917a37e221e779cb91538f8688e2652e" + }, + { + "dataPath": "params_shard_134.bin", + "format": "raw-shard", + "nbytes": 201326592, + "records": [ + { + "name": "model.layers.35.feed_forward.w2.weight", + "shape": [ + 6144, + 16384 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 201326592, + "byteOffset": 0 + } + ], + "md5sum": "bdd848bc9a8851a6bdd5267d82e93d1d" + }, + { + "dataPath": "params_shard_135.bin", + "format": "raw-shard", + "nbytes": 75497472, + "records": [ + { + "name": "model.layers.36.attention.wo.weight", + "shape": [ + 6144, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 75497472, + "byteOffset": 0 + } + ], + "md5sum": "669c98169ce559d5dea183321e2d1f77" + }, + { + "dataPath": "params_shard_136.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.36.attention.wqkv.weight", + "shape": [ + 8192, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "7872deaa142c04564b60ecf747d6c64e" + }, + { + "dataPath": "params_shard_137.bin", + "format": "raw-shard", + "nbytes": 402653184, + "records": [ + { + "name": "model.layers.36.feed_forward.gate_up_proj.weight", + "shape": [ + 32768, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 402653184, + "byteOffset": 0 + } + ], + "md5sum": "f3be3dc845e43f554795f99cdfcfe056" + }, + { + "dataPath": "params_shard_138.bin", + "format": "raw-shard", + "nbytes": 201326592, + "records": [ + { + "name": "model.layers.36.feed_forward.w2.weight", + "shape": [ + 6144, + 16384 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 201326592, + "byteOffset": 0 + } + ], + "md5sum": "604a687ccc4eda5384c0cdd6bfb7ce8c" + }, + { + "dataPath": "params_shard_139.bin", + "format": "raw-shard", + "nbytes": 75497472, + "records": [ + { + "name": "model.layers.37.attention.wo.weight", + "shape": [ + 6144, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 75497472, + "byteOffset": 0 + } + ], + "md5sum": "c8d84ec208254fedf2a501cf11387b5b" + }, + { + "dataPath": "params_shard_140.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.37.attention.wqkv.weight", + "shape": [ + 8192, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "a65bb61f3410797558e33f35224da13a" + }, + { + "dataPath": "params_shard_141.bin", + "format": "raw-shard", + "nbytes": 402653184, + "records": [ + { + "name": "model.layers.37.feed_forward.gate_up_proj.weight", + "shape": [ + 32768, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 402653184, + "byteOffset": 0 + } + ], + "md5sum": "6797a4c7ef7f2259e464bf163d050846" + }, + { + "dataPath": "params_shard_142.bin", + "format": "raw-shard", + "nbytes": 201326592, + "records": [ + { + "name": "model.layers.37.feed_forward.w2.weight", + "shape": [ + 6144, + 16384 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 201326592, + "byteOffset": 0 + } + ], + "md5sum": "536829d2be23bd13a427d6bc71209e86" + }, + { + "dataPath": "params_shard_143.bin", + "format": "raw-shard", + "nbytes": 75497472, + "records": [ + { + "name": "model.layers.38.attention.wo.weight", + "shape": [ + 6144, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 75497472, + "byteOffset": 0 + } + ], + "md5sum": "0400791d56834f98233c6d49c0551cb4" + }, + { + "dataPath": "params_shard_144.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.38.attention.wqkv.weight", + "shape": [ + 8192, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "b0fb70adc1ae7a7ccce055f7e14a860f" + }, + { + "dataPath": "params_shard_145.bin", + "format": "raw-shard", + "nbytes": 402653184, + "records": [ + { + "name": "model.layers.38.feed_forward.gate_up_proj.weight", + "shape": [ + 32768, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 402653184, + "byteOffset": 0 + } + ], + "md5sum": "d6edf85c6e98e21bc1c20e19711e9d0a" + }, + { + "dataPath": "params_shard_146.bin", + "format": "raw-shard", + "nbytes": 201326592, + "records": [ + { + "name": "model.layers.38.feed_forward.w2.weight", + "shape": [ + 6144, + 16384 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 201326592, + "byteOffset": 0 + } + ], + "md5sum": "cf7deb1a5452e19b9555e838e76e8d53" + }, + { + "dataPath": "params_shard_147.bin", + "format": "raw-shard", + "nbytes": 75497472, + "records": [ + { + "name": "model.layers.39.attention.wo.weight", + "shape": [ + 6144, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 75497472, + "byteOffset": 0 + } + ], + "md5sum": "7aa85dd5098c8da2322d847f135c82e4" + }, + { + "dataPath": "params_shard_148.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.39.attention.wqkv.weight", + "shape": [ + 8192, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "2e3dadee443611c5c500e209923f40f2" + }, + { + "dataPath": "params_shard_149.bin", + "format": "raw-shard", + "nbytes": 402653184, + "records": [ + { + "name": "model.layers.39.feed_forward.gate_up_proj.weight", + "shape": [ + 32768, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 402653184, + "byteOffset": 0 + } + ], + "md5sum": "ae5ff02ddc94b63e22feafa08835eadf" + }, + { + "dataPath": "params_shard_150.bin", + "format": "raw-shard", + "nbytes": 201326592, + "records": [ + { + "name": "model.layers.39.feed_forward.w2.weight", + "shape": [ + 6144, + 16384 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 201326592, + "byteOffset": 0 + } + ], + "md5sum": "cd40690067c1fc56e5691dc42f9573dc" + }, + { + "dataPath": "params_shard_151.bin", + "format": "raw-shard", + "nbytes": 75497472, + "records": [ + { + "name": "model.layers.40.attention.wo.weight", + "shape": [ + 6144, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 75497472, + "byteOffset": 0 + } + ], + "md5sum": "bca8b308788f3142f45b18eb32d79d01" + }, + { + "dataPath": "params_shard_152.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.40.attention.wqkv.weight", + "shape": [ + 8192, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "557e4ad17874e2552be46fb22818ec1c" + }, + { + "dataPath": "params_shard_153.bin", + "format": "raw-shard", + "nbytes": 402653184, + "records": [ + { + "name": "model.layers.40.feed_forward.gate_up_proj.weight", + "shape": [ + 32768, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 402653184, + "byteOffset": 0 + } + ], + "md5sum": "aaea8ca7014a58e446d285a8ddfefe09" + }, + { + "dataPath": "params_shard_154.bin", + "format": "raw-shard", + "nbytes": 201326592, + "records": [ + { + "name": "model.layers.40.feed_forward.w2.weight", + "shape": [ + 6144, + 16384 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 201326592, + "byteOffset": 0 + } + ], + "md5sum": "ef63b0787d5a92af34ca536bb84f7164" + }, + { + "dataPath": "params_shard_155.bin", + "format": "raw-shard", + "nbytes": 75497472, + "records": [ + { + "name": "model.layers.41.attention.wo.weight", + "shape": [ + 6144, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 75497472, + "byteOffset": 0 + } + ], + "md5sum": "05dcca9cd56a9636a9484df68b068351" + }, + { + "dataPath": "params_shard_156.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.41.attention.wqkv.weight", + "shape": [ + 8192, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "89e72bdc3a6de41a45f81f8062bc9957" + }, + { + "dataPath": "params_shard_157.bin", + "format": "raw-shard", + "nbytes": 402653184, + "records": [ + { + "name": "model.layers.41.feed_forward.gate_up_proj.weight", + "shape": [ + 32768, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 402653184, + "byteOffset": 0 + } + ], + "md5sum": "f3c856eb9e9de74f6d0cc852d3b8b921" + }, + { + "dataPath": "params_shard_158.bin", + "format": "raw-shard", + "nbytes": 201326592, + "records": [ + { + "name": "model.layers.41.feed_forward.w2.weight", + "shape": [ + 6144, + 16384 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 201326592, + "byteOffset": 0 + } + ], + "md5sum": "83d2bb1e1ee58fa9e75650b7f166ece2" + }, + { + "dataPath": "params_shard_159.bin", + "format": "raw-shard", + "nbytes": 75497472, + "records": [ + { + "name": "model.layers.42.attention.wo.weight", + "shape": [ + 6144, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 75497472, + "byteOffset": 0 + } + ], + "md5sum": "9a07a3bb1028bdb25065cc80d6ff5371" + }, + { + "dataPath": "params_shard_160.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.42.attention.wqkv.weight", + "shape": [ + 8192, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "8274125b1c0b68ff93ef8b9d983a3033" + }, + { + "dataPath": "params_shard_161.bin", + "format": "raw-shard", + "nbytes": 402653184, + "records": [ + { + "name": "model.layers.42.feed_forward.gate_up_proj.weight", + "shape": [ + 32768, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 402653184, + "byteOffset": 0 + } + ], + "md5sum": "8ee5fd9692c64c3db42bf23f398d26ce" + }, + { + "dataPath": "params_shard_162.bin", + "format": "raw-shard", + "nbytes": 201326592, + "records": [ + { + "name": "model.layers.42.feed_forward.w2.weight", + "shape": [ + 6144, + 16384 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 201326592, + "byteOffset": 0 + } + ], + "md5sum": "3ecfb92f2e0dbb32a9eeca40890341ce" + }, + { + "dataPath": "params_shard_163.bin", + "format": "raw-shard", + "nbytes": 75497472, + "records": [ + { + "name": "model.layers.43.attention.wo.weight", + "shape": [ + 6144, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 75497472, + "byteOffset": 0 + } + ], + "md5sum": "3aa9885182a7319e2437f23d31342ef1" + }, + { + "dataPath": "params_shard_164.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.43.attention.wqkv.weight", + "shape": [ + 8192, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "fd5619a8fe09763661d26c3d561208a0" + }, + { + "dataPath": "params_shard_165.bin", + "format": "raw-shard", + "nbytes": 402653184, + "records": [ + { + "name": "model.layers.43.feed_forward.gate_up_proj.weight", + "shape": [ + 32768, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 402653184, + "byteOffset": 0 + } + ], + "md5sum": "1d162302debd25d0738ebc27e3845f6d" + }, + { + "dataPath": "params_shard_166.bin", + "format": "raw-shard", + "nbytes": 201326592, + "records": [ + { + "name": "model.layers.43.feed_forward.w2.weight", + "shape": [ + 6144, + 16384 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 201326592, + "byteOffset": 0 + } + ], + "md5sum": "e4a91e37cd73d9771f0582183591e19b" + }, + { + "dataPath": "params_shard_167.bin", + "format": "raw-shard", + "nbytes": 75497472, + "records": [ + { + "name": "model.layers.44.attention.wo.weight", + "shape": [ + 6144, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 75497472, + "byteOffset": 0 + } + ], + "md5sum": "bed296e48e01809cb8212c76825a665b" + }, + { + "dataPath": "params_shard_168.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.44.attention.wqkv.weight", + "shape": [ + 8192, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "08b639d0c18fcbf7c1a63fb749c5fa9b" + }, + { + "dataPath": "params_shard_169.bin", + "format": "raw-shard", + "nbytes": 402653184, + "records": [ + { + "name": "model.layers.44.feed_forward.gate_up_proj.weight", + "shape": [ + 32768, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 402653184, + "byteOffset": 0 + } + ], + "md5sum": "7709a967a0c53f0efc08eeb59241cd4e" + }, + { + "dataPath": "params_shard_170.bin", + "format": "raw-shard", + "nbytes": 201326592, + "records": [ + { + "name": "model.layers.44.feed_forward.w2.weight", + "shape": [ + 6144, + 16384 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 201326592, + "byteOffset": 0 + } + ], + "md5sum": "143bc4d87bca35dc24a66f9c75c7e115" + }, + { + "dataPath": "params_shard_171.bin", + "format": "raw-shard", + "nbytes": 75497472, + "records": [ + { + "name": "model.layers.45.attention.wo.weight", + "shape": [ + 6144, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 75497472, + "byteOffset": 0 + } + ], + "md5sum": "55ba57cff3ea364b21d309c6913dce62" + }, + { + "dataPath": "params_shard_172.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.45.attention.wqkv.weight", + "shape": [ + 8192, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "b915ec4f1a2bd7b9dd4caf2280583c7c" + }, + { + "dataPath": "params_shard_173.bin", + "format": "raw-shard", + "nbytes": 402653184, + "records": [ + { + "name": "model.layers.45.feed_forward.gate_up_proj.weight", + "shape": [ + 32768, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 402653184, + "byteOffset": 0 + } + ], + "md5sum": "966fb0b1ad391b49d663ef61a7097c5d" + }, + { + "dataPath": "params_shard_174.bin", + "format": "raw-shard", + "nbytes": 201326592, + "records": [ + { + "name": "model.layers.45.feed_forward.w2.weight", + "shape": [ + 6144, + 16384 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 201326592, + "byteOffset": 0 + } + ], + "md5sum": "ca0ae515b744050af3357f02553ee0a2" + }, + { + "dataPath": "params_shard_175.bin", + "format": "raw-shard", + "nbytes": 75497472, + "records": [ + { + "name": "model.layers.46.attention.wo.weight", + "shape": [ + 6144, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 75497472, + "byteOffset": 0 + } + ], + "md5sum": "975731a3575a366de954484c040611d2" + }, + { + "dataPath": "params_shard_176.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.46.attention.wqkv.weight", + "shape": [ + 8192, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "a7a90fffbc267a8794a0d749a395466a" + }, + { + "dataPath": "params_shard_177.bin", + "format": "raw-shard", + "nbytes": 402653184, + "records": [ + { + "name": "model.layers.46.feed_forward.gate_up_proj.weight", + "shape": [ + 32768, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 402653184, + "byteOffset": 0 + } + ], + "md5sum": "091009488a5c71860f1887ef965c433f" + }, + { + "dataPath": "params_shard_178.bin", + "format": "raw-shard", + "nbytes": 201326592, + "records": [ + { + "name": "model.layers.46.feed_forward.w2.weight", + "shape": [ + 6144, + 16384 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 201326592, + "byteOffset": 0 + } + ], + "md5sum": "bbba14991bf109f5a4343bde92618bcf" + }, + { + "dataPath": "params_shard_179.bin", + "format": "raw-shard", + "nbytes": 75497472, + "records": [ + { + "name": "model.layers.47.attention.wo.weight", + "shape": [ + 6144, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 75497472, + "byteOffset": 0 + } + ], + "md5sum": "5af00b0e44df026910ce20f1ce1ea148" + }, + { + "dataPath": "params_shard_180.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.47.attention.wqkv.weight", + "shape": [ + 8192, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "ae2639212fe60abadedffff3988c2467" + }, + { + "dataPath": "params_shard_181.bin", + "format": "raw-shard", + "nbytes": 402653184, + "records": [ + { + "name": "model.layers.47.feed_forward.gate_up_proj.weight", + "shape": [ + 32768, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 402653184, + "byteOffset": 0 + } + ], + "md5sum": "01f1fae460e95c1a2b4a4698d6491a7f" + }, + { + "dataPath": "params_shard_182.bin", + "format": "raw-shard", + "nbytes": 201326592, + "records": [ + { + "name": "model.layers.47.feed_forward.w2.weight", + "shape": [ + 6144, + 16384 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 201326592, + "byteOffset": 0 + } + ], + "md5sum": "e35e3802e509e8248c9d0d65ffb4d84d" + }, + { + "dataPath": "params_shard_183.bin", + "format": "raw-shard", + "nbytes": 75497472, + "records": [ + { + "name": "model.layers.6.attention.wo.weight", + "shape": [ + 6144, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 75497472, + "byteOffset": 0 + } + ], + "md5sum": "000574e1f5c50c785709e320aae224be" + }, + { + "dataPath": "params_shard_184.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.6.attention.wqkv.weight", + "shape": [ + 8192, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "ece6470c49ccf429481fac9d62cdb081" + }, + { + "dataPath": "params_shard_185.bin", + "format": "raw-shard", + "nbytes": 402653184, + "records": [ + { + "name": "model.layers.6.feed_forward.gate_up_proj.weight", + "shape": [ + 32768, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 402653184, + "byteOffset": 0 + } + ], + "md5sum": "982b234ab6c6dbb3af157be8426f6448" + }, + { + "dataPath": "params_shard_186.bin", + "format": "raw-shard", + "nbytes": 201326592, + "records": [ + { + "name": "model.layers.6.feed_forward.w2.weight", + "shape": [ + 6144, + 16384 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 201326592, + "byteOffset": 0 + } + ], + "md5sum": "7dbef8765e3ff403d9f3a26e33cbece6" + }, + { + "dataPath": "params_shard_187.bin", + "format": "raw-shard", + "nbytes": 75497472, + "records": [ + { + "name": "model.layers.7.attention.wo.weight", + "shape": [ + 6144, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 75497472, + "byteOffset": 0 + } + ], + "md5sum": "63a11aa5b639ae8a4b92c37f8d3206e7" + }, + { + "dataPath": "params_shard_188.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.7.attention.wqkv.weight", + "shape": [ + 8192, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "5244855502245015ee7e5e293593aebd" + }, + { + "dataPath": "params_shard_189.bin", + "format": "raw-shard", + "nbytes": 402653184, + "records": [ + { + "name": "model.layers.7.feed_forward.gate_up_proj.weight", + "shape": [ + 32768, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 402653184, + "byteOffset": 0 + } + ], + "md5sum": "e81ede3b54e31a30cf854b89a1ff3944" + }, + { + "dataPath": "params_shard_190.bin", + "format": "raw-shard", + "nbytes": 201326592, + "records": [ + { + "name": "model.layers.7.feed_forward.w2.weight", + "shape": [ + 6144, + 16384 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 201326592, + "byteOffset": 0 + } + ], + "md5sum": "d44a76d8f61f376a4268aef32ed059d7" + }, + { + "dataPath": "params_shard_191.bin", + "format": "raw-shard", + "nbytes": 75497472, + "records": [ + { + "name": "model.layers.8.attention.wo.weight", + "shape": [ + 6144, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 75497472, + "byteOffset": 0 + } + ], + "md5sum": "ef10714372f5ad230109ebaca8a4c09d" + }, + { + "dataPath": "params_shard_192.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.8.attention.wqkv.weight", + "shape": [ + 8192, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "97179e5140290259938be5fe5033d0b1" + }, + { + "dataPath": "params_shard_193.bin", + "format": "raw-shard", + "nbytes": 1137180672, + "records": [ + { + "name": "output.weight", + "shape": [ + 92544, + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 1137180672, + "byteOffset": 0 + } + ], + "md5sum": "466cef09e5f4201900768e4ffb19c0d5" + }, + { + "dataPath": "params_shard_194.bin", + "format": "raw-shard", + "nbytes": 1191936, + "records": [ + { + "name": "model.layers.0.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 0 + }, + { + "name": "model.layers.0.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 12288 + }, + { + "name": "model.layers.1.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 24576 + }, + { + "name": "model.layers.1.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 36864 + }, + { + "name": "model.layers.2.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 49152 + }, + { + "name": "model.layers.2.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 61440 + }, + { + "name": "model.layers.10.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 73728 + }, + { + "name": "model.layers.10.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 86016 + }, + { + "name": "model.layers.8.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 98304 + }, + { + "name": "model.layers.8.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 110592 + }, + { + "name": "model.layers.9.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 122880 + }, + { + "name": "model.layers.9.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 135168 + }, + { + "name": "model.layers.11.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 147456 + }, + { + "name": "model.layers.11.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 159744 + }, + { + "name": "model.layers.12.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 172032 + }, + { + "name": "model.layers.12.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 184320 + }, + { + "name": "model.layers.13.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 196608 + }, + { + "name": "model.layers.13.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 208896 + }, + { + "name": "model.layers.14.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 221184 + }, + { + "name": "model.layers.14.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 233472 + }, + { + "name": "model.layers.15.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 245760 + }, + { + "name": "model.layers.15.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 258048 + }, + { + "name": "model.layers.16.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 270336 + }, + { + "name": "model.layers.16.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 282624 + }, + { + "name": "model.layers.17.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 294912 + }, + { + "name": "model.layers.17.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 307200 + }, + { + "name": "model.layers.18.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 319488 + }, + { + "name": "model.layers.18.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 331776 + }, + { + "name": "model.layers.19.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 344064 + }, + { + "name": "model.layers.19.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 356352 + }, + { + "name": "model.layers.20.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 368640 + }, + { + "name": "model.layers.20.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 380928 + }, + { + "name": "model.layers.21.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 393216 + }, + { + "name": "model.layers.21.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 405504 + }, + { + "name": "model.layers.22.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 417792 + }, + { + "name": "model.layers.22.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 430080 + }, + { + "name": "model.layers.23.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 442368 + }, + { + "name": "model.layers.23.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 454656 + }, + { + "name": "model.layers.24.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 466944 + }, + { + "name": "model.layers.24.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 479232 + }, + { + "name": "model.layers.25.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 491520 + }, + { + "name": "model.layers.25.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 503808 + }, + { + "name": "model.layers.26.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 516096 + }, + { + "name": "model.layers.26.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 528384 + }, + { + "name": "model.layers.27.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 540672 + }, + { + "name": "model.layers.27.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 552960 + }, + { + "name": "model.layers.28.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 565248 + }, + { + "name": "model.layers.28.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 577536 + }, + { + "name": "model.layers.29.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 589824 + }, + { + "name": "model.layers.29.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 602112 + }, + { + "name": "model.layers.30.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 614400 + }, + { + "name": "model.layers.30.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 626688 + }, + { + "name": "model.layers.3.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 638976 + }, + { + "name": "model.layers.3.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 651264 + }, + { + "name": "model.layers.4.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 663552 + }, + { + "name": "model.layers.4.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 675840 + }, + { + "name": "model.layers.5.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 688128 + }, + { + "name": "model.layers.5.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 700416 + }, + { + "name": "model.layers.31.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 712704 + }, + { + "name": "model.layers.31.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 724992 + }, + { + "name": "model.layers.32.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 737280 + }, + { + "name": "model.layers.32.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 749568 + }, + { + "name": "model.layers.33.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 761856 + }, + { + "name": "model.layers.33.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 774144 + }, + { + "name": "model.layers.34.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 786432 + }, + { + "name": "model.layers.34.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 798720 + }, + { + "name": "model.layers.35.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 811008 + }, + { + "name": "model.layers.35.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 823296 + }, + { + "name": "model.layers.36.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 835584 + }, + { + "name": "model.layers.36.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 847872 + }, + { + "name": "model.layers.37.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 860160 + }, + { + "name": "model.layers.37.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 872448 + }, + { + "name": "model.layers.38.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 884736 + }, + { + "name": "model.layers.38.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 897024 + }, + { + "name": "model.layers.39.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 909312 + }, + { + "name": "model.layers.39.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 921600 + }, + { + "name": "model.layers.40.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 933888 + }, + { + "name": "model.layers.40.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 946176 + }, + { + "name": "model.layers.41.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 958464 + }, + { + "name": "model.layers.41.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 970752 + }, + { + "name": "model.layers.42.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 983040 + }, + { + "name": "model.layers.42.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 995328 + }, + { + "name": "model.layers.43.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 1007616 + }, + { + "name": "model.layers.43.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 1019904 + }, + { + "name": "model.layers.44.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 1032192 + }, + { + "name": "model.layers.44.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 1044480 + }, + { + "name": "model.layers.45.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 1056768 + }, + { + "name": "model.layers.45.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 1069056 + }, + { + "name": "model.layers.46.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 1081344 + }, + { + "name": "model.layers.46.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 1093632 + }, + { + "name": "model.layers.47.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 1105920 + }, + { + "name": "model.layers.47.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 1118208 + }, + { + "name": "model.norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 1130496 + }, + { + "name": "model.layers.6.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 1142784 + }, + { + "name": "model.layers.6.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 1155072 + }, + { + "name": "model.layers.7.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 1167360 + }, + { + "name": "model.layers.7.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 1179648 + } + ], + "md5sum": "80e313b0363be60fb7c8c56c2175d304" + } + ] +} \ No newline at end of file diff --git a/params_shard_0.bin b/params_shard_0.bin new file mode 100644 index 0000000000000000000000000000000000000000..0eea34950d0f2e7582f3791fc60404dace0bef98 --- /dev/null +++ b/params_shard_0.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10343310dced66dc4dad85c0a3ab7486f36baddb2fc3ead4a3afd52fa495fb60 +size 75497472 diff --git a/params_shard_1.bin b/params_shard_1.bin new file mode 100644 index 0000000000000000000000000000000000000000..c2cfdd157f8a6d10f322f45805f132bccb220d9b --- /dev/null +++ b/params_shard_1.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6c6d426495f66047c737b9b1a0699f48f6b49fb85d1ca63b753a48c427e15a5 +size 100663296 diff --git a/params_shard_10.bin b/params_shard_10.bin new file mode 100644 index 0000000000000000000000000000000000000000..5bcd845ef85f94699b6ee300a4c811a8bd00514c --- /dev/null +++ b/params_shard_10.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:714b1a41849f418022fa1e3f3fbc1af410ebb395674863c1c61470946471326d +size 100663296 diff --git a/params_shard_100.bin b/params_shard_100.bin new file mode 100644 index 0000000000000000000000000000000000000000..92f21dadfea62977c2a01a48f3b8270677de1a8b --- /dev/null +++ b/params_shard_100.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d8abb50942fb7fc475fa99edae3fc6292e85bb183185b2b261c1bcd43a565a3 +size 402653184 diff --git a/params_shard_101.bin b/params_shard_101.bin new file mode 100644 index 0000000000000000000000000000000000000000..cc8d41561057e434ec798071e5d9a45884640502 --- /dev/null +++ b/params_shard_101.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7318caacd2d01f90cc8153f3917863c892d732ae64a1c7a64f6722d7b3048e77 +size 201326592 diff --git a/params_shard_102.bin b/params_shard_102.bin new file mode 100644 index 0000000000000000000000000000000000000000..c0469b7df0f6ebb6b24049c90fcd6374fa23e947 --- /dev/null +++ b/params_shard_102.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52fd03a7f43d101b31e5102f319cc3180df047f98e7b6f169ffb46faeb8670b7 +size 75497472 diff --git a/params_shard_103.bin b/params_shard_103.bin new file mode 100644 index 0000000000000000000000000000000000000000..ed24df366e1455f08519f9f28fa5cc410b46f47b --- /dev/null +++ b/params_shard_103.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7faaeabb5d4efad6d550e17905a34abfcd98ca9c9bfa142e4b5b6be0dd73fb6d +size 100663296 diff --git a/params_shard_104.bin b/params_shard_104.bin new file mode 100644 index 0000000000000000000000000000000000000000..79cc4082bf5f1d6b36317a1dff96658c007e8bda --- /dev/null +++ b/params_shard_104.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39c045a946a4ee2be6ef255babf5ad0afde6ce340179e3f225a9a4cef76fff9c +size 402653184 diff --git a/params_shard_105.bin b/params_shard_105.bin new file mode 100644 index 0000000000000000000000000000000000000000..394f8e1e85677c9492c44118c24ceb2f7b5971cd --- /dev/null +++ b/params_shard_105.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90a5bc5173371c2634fddbe302b745ac9415491e70c187ff66e20f673bd59dc5 +size 201326592 diff --git a/params_shard_106.bin b/params_shard_106.bin new file mode 100644 index 0000000000000000000000000000000000000000..f3a3978220ee76f0b61bf8d28c0e1a1da7563698 --- /dev/null +++ b/params_shard_106.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4fef6d545e2339446dfaa8a44be45ea1a43db45f126c629790530a7a42ec05b +size 201326592 diff --git a/params_shard_107.bin b/params_shard_107.bin new file mode 100644 index 0000000000000000000000000000000000000000..f28008d819aac8260c8e3e8f4ae2c2e1e30d7750 --- /dev/null +++ b/params_shard_107.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf4153377b890e9ff3f96ac7e33651c9304ff0bc846ad74983c51e6fd28b7127 +size 75497472 diff --git a/params_shard_108.bin b/params_shard_108.bin new file mode 100644 index 0000000000000000000000000000000000000000..0916e0650c84ba1fde826e7a9f5d742009cd11e8 --- /dev/null +++ b/params_shard_108.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db93157283eef94e803592070c9002c30955c55a5439ec23a5b0931b96d34387 +size 100663296 diff --git a/params_shard_109.bin b/params_shard_109.bin new file mode 100644 index 0000000000000000000000000000000000000000..bc5ed55bcf6ac3c0a52e53cac304a6b83a901f2c --- /dev/null +++ b/params_shard_109.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df081958ec6683c9f68b44af67a61a2730d31d193370a811d14d19eeab790cb9 +size 402653184 diff --git a/params_shard_11.bin b/params_shard_11.bin new file mode 100644 index 0000000000000000000000000000000000000000..7231ba3e9fdb6aad4a17258def39395147d740b2 --- /dev/null +++ b/params_shard_11.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a419408a722961a2632fab9dc8666796c62b9d0a1a4cfa539b42f655ba8db9b +size 402653184 diff --git a/params_shard_110.bin b/params_shard_110.bin new file mode 100644 index 0000000000000000000000000000000000000000..57aa4040411927c5719136db574aa9d8066b32b6 --- /dev/null +++ b/params_shard_110.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f62ffe7474e52bafcfff0530d8521914559b845c9fa9252b035544724e2af1ef +size 201326592 diff --git a/params_shard_111.bin b/params_shard_111.bin new file mode 100644 index 0000000000000000000000000000000000000000..ebb21dd81ca47b4ecd65816cb7458aa184369806 --- /dev/null +++ b/params_shard_111.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05173a3b9aa062822f75393aca4381acbcb8ffb38c67fb4eb006e6807ffac066 +size 75497472 diff --git a/params_shard_112.bin b/params_shard_112.bin new file mode 100644 index 0000000000000000000000000000000000000000..8815d255f16dddffa536537eb5dd80f3bf648820 --- /dev/null +++ b/params_shard_112.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdee0d682d58771039ec78d76a4d4390b1e6e2a471fa28b035fd5fa9d9e5bda6 +size 100663296 diff --git a/params_shard_113.bin b/params_shard_113.bin new file mode 100644 index 0000000000000000000000000000000000000000..d634b1609de49638e5df1d1fbb751d4df1a5822a --- /dev/null +++ b/params_shard_113.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4680e4d791d3bf301f31b540f0541a7e2bb29b6d96c00c5480bbdfd695214d2f +size 402653184 diff --git a/params_shard_114.bin b/params_shard_114.bin new file mode 100644 index 0000000000000000000000000000000000000000..8eed34df39fcf510b2436541d12dfa632ea65a28 --- /dev/null +++ b/params_shard_114.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d8e6c23c70dc1be3735c67f4c01e4055dc024b97458ccb9f2f8af018062d311 +size 201326592 diff --git a/params_shard_115.bin b/params_shard_115.bin new file mode 100644 index 0000000000000000000000000000000000000000..6b2b584745559b82d80771ed951ead8e7718bc31 --- /dev/null +++ b/params_shard_115.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e7705c2da3d54a72ff654490951626bbf8a71e65bc97073458964bf43de9da0 +size 75497472 diff --git a/params_shard_116.bin b/params_shard_116.bin new file mode 100644 index 0000000000000000000000000000000000000000..6001509520d55af64845ab3d1613e7ef8cca0296 --- /dev/null +++ b/params_shard_116.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc3674eed9dad4804177939064427e042a2646bdc3ee8d38eae75cf6f3045a69 +size 100663296 diff --git a/params_shard_117.bin b/params_shard_117.bin new file mode 100644 index 0000000000000000000000000000000000000000..59c73f3407ac93c08e8d9ac5c4ad81bfd43141ff --- /dev/null +++ b/params_shard_117.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:853c95c1a0748297620ea1d92981c31cbb06b820c2be9f08ca8349e9655cf9c9 +size 402653184 diff --git a/params_shard_118.bin b/params_shard_118.bin new file mode 100644 index 0000000000000000000000000000000000000000..0d9b21317c77a834b57c9eaa98e9ae07abd1feac --- /dev/null +++ b/params_shard_118.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce254406ef75ffe3075652811db088be74bd1d7190f51e79c085970f8daca702 +size 201326592 diff --git a/params_shard_119.bin b/params_shard_119.bin new file mode 100644 index 0000000000000000000000000000000000000000..c1f0821b7da305ed62ffa835543751b5e9a4e742 --- /dev/null +++ b/params_shard_119.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c45dbdb358ba390a8d20024c13d8750c5fc8e3e381f37380d13652514ec9e046 +size 75497472 diff --git a/params_shard_12.bin b/params_shard_12.bin new file mode 100644 index 0000000000000000000000000000000000000000..2b09f0c94f71ace05ff615e865dcf965ec024202 --- /dev/null +++ b/params_shard_12.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7beab71c0ca3b0cf14585c9a1837c9b02563e06d07da57bd40a8ad96d518b485 +size 201326592 diff --git a/params_shard_120.bin b/params_shard_120.bin new file mode 100644 index 0000000000000000000000000000000000000000..212e72c426b9f08be7b7d6ccaa9cac32e5f6e4ed --- /dev/null +++ b/params_shard_120.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cc8250d9cdb29a3f99b9114c5cf1d1ad0a7217df388e9d9f58ebccc7c025d6d +size 100663296 diff --git a/params_shard_121.bin b/params_shard_121.bin new file mode 100644 index 0000000000000000000000000000000000000000..622de054afd095ca50b531a1edc7b3f8dd964b62 --- /dev/null +++ b/params_shard_121.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d40ed03ce3d4cfba117690d53ad9f1e5f11d8823cb6ae4b833369b9b30878183 +size 402653184 diff --git a/params_shard_122.bin b/params_shard_122.bin new file mode 100644 index 0000000000000000000000000000000000000000..98bdfc5147fdb8c078ecd72c5712dce3e7e794cd --- /dev/null +++ b/params_shard_122.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43aa56e5588f9477830281e29748789b64d981f4e1e30f5188942d4ba9a5252e +size 201326592 diff --git a/params_shard_123.bin b/params_shard_123.bin new file mode 100644 index 0000000000000000000000000000000000000000..34cedee6e84a5a462b3a63d2a98611a4ae43c6bb --- /dev/null +++ b/params_shard_123.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37979a37f7ddc92c137a2d4b8a800eb6542721949e29fddb31672c1444b71397 +size 75497472 diff --git a/params_shard_124.bin b/params_shard_124.bin new file mode 100644 index 0000000000000000000000000000000000000000..f745fca4ddc217e0ef583e1e97e2e865732e6ee5 --- /dev/null +++ b/params_shard_124.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3e6d8e3feb21e8edbd2c115fd44281b2ddf71da1d450e968418f5086209fac8 +size 100663296 diff --git a/params_shard_125.bin b/params_shard_125.bin new file mode 100644 index 0000000000000000000000000000000000000000..2c98b5cffa078ec9a4234cb1cb3a9e30e2b31a31 --- /dev/null +++ b/params_shard_125.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:089db085a4d1639e3b4bffd3608fb3c5307401b4c92d50b7e0612fee17b3ff11 +size 402653184 diff --git a/params_shard_126.bin b/params_shard_126.bin new file mode 100644 index 0000000000000000000000000000000000000000..49be57a40df33ab936c23f647d51eb5eb749e927 --- /dev/null +++ b/params_shard_126.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca037edf7a274094f436c4107edab17dff79ef182043d9e6806e98c3ad5dc0b7 +size 201326592 diff --git a/params_shard_127.bin b/params_shard_127.bin new file mode 100644 index 0000000000000000000000000000000000000000..1a99cd2d9ed04dfb9267f2930ba7f3c5248191c5 --- /dev/null +++ b/params_shard_127.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81f1aa86ac0246dc3884106604758998d51045665414d98c32f148656e03359f +size 75497472 diff --git a/params_shard_128.bin b/params_shard_128.bin new file mode 100644 index 0000000000000000000000000000000000000000..097fa71568877d8bb157c4323ad4f28b7ce990bf --- /dev/null +++ b/params_shard_128.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48a2e608245585e7916fcdc9274a13bdca226894aab47d1394f480852c252acc +size 100663296 diff --git a/params_shard_129.bin b/params_shard_129.bin new file mode 100644 index 0000000000000000000000000000000000000000..fcba846fa478d30f82d2f427fdfe18dc34cffd37 --- /dev/null +++ b/params_shard_129.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6834f27dac30ab39c7ff0592d3653957a8a3fae8c8b17870d1afafb7ea4d85b9 +size 402653184 diff --git a/params_shard_13.bin b/params_shard_13.bin new file mode 100644 index 0000000000000000000000000000000000000000..ba9086f8715d95459db177bc5000b6714648fea9 --- /dev/null +++ b/params_shard_13.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:416f1015afd629e6900ebb7fac50065ff9ec245ad91e3675a3b68ed19c6bec22 +size 75497472 diff --git a/params_shard_130.bin b/params_shard_130.bin new file mode 100644 index 0000000000000000000000000000000000000000..542af57cb22e40dfc7fa0e1ab33a6fb74ff1771d --- /dev/null +++ b/params_shard_130.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5dbb0d2d1078a741e83d7da2d1e966e7f181ce5c315b1c62dd152d7f1ebe6c1 +size 201326592 diff --git a/params_shard_131.bin b/params_shard_131.bin new file mode 100644 index 0000000000000000000000000000000000000000..08a1913df306202ff5a0f0cb248efd7291450475 --- /dev/null +++ b/params_shard_131.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b92ac8b3e2ea65dcbe7b0a51402a305cb5ed1c8545d153f0d5bdec7a702e928 +size 75497472 diff --git a/params_shard_132.bin b/params_shard_132.bin new file mode 100644 index 0000000000000000000000000000000000000000..b98fa7c3307f740ead35aec07195269a33ceebaa --- /dev/null +++ b/params_shard_132.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c81a5bef687044e41e0edce322640b9c4abd0aa5396eea34c59081fb95d2fb52 +size 100663296 diff --git a/params_shard_133.bin b/params_shard_133.bin new file mode 100644 index 0000000000000000000000000000000000000000..9366227878c8f6345e718cf4b03d3ba5c9c5c9e3 --- /dev/null +++ b/params_shard_133.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7e482991f8e269f0ab6daeeef4353c86bf05ad6418e98e4094b15b36ba0c8c9 +size 402653184 diff --git a/params_shard_134.bin b/params_shard_134.bin new file mode 100644 index 0000000000000000000000000000000000000000..3ca7d84cb775f3a090d5b703a70174fe9ebb69a0 --- /dev/null +++ b/params_shard_134.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0300bb0e3ac41d78b0fc46cac674cc75295eb94c82b6ba0780e908087a7177e +size 201326592 diff --git a/params_shard_135.bin b/params_shard_135.bin new file mode 100644 index 0000000000000000000000000000000000000000..4052ee978249118d20fb4d44f47cc9da163059a0 --- /dev/null +++ b/params_shard_135.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:520a0671442f61143e36114c4639fba57825a60111ad908b0be280f833e9abf9 +size 75497472 diff --git a/params_shard_136.bin b/params_shard_136.bin new file mode 100644 index 0000000000000000000000000000000000000000..c7ccc811d90870ac5dae4904d8863c262c9fb93a --- /dev/null +++ b/params_shard_136.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d23e0c5e54704ee64e184aa8cfee12fdc50db543e555a45344f1fe121e40afbb +size 100663296 diff --git a/params_shard_137.bin b/params_shard_137.bin new file mode 100644 index 0000000000000000000000000000000000000000..9357e24ebce5ba5ed14b9bc320b3ecdfe64f91b9 --- /dev/null +++ b/params_shard_137.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efef5a5514322c25365236643b4108f680e99551c7533bb5d2c9d5ca574a3be7 +size 402653184 diff --git a/params_shard_138.bin b/params_shard_138.bin new file mode 100644 index 0000000000000000000000000000000000000000..cb974686f4e031d9663ce0c79a830216d7a6e39f --- /dev/null +++ b/params_shard_138.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5391ac1c8c256bccc718dbfb9ff2486d6086a9f51e11f05339f8573710a76c0 +size 201326592 diff --git a/params_shard_139.bin b/params_shard_139.bin new file mode 100644 index 0000000000000000000000000000000000000000..4aa8be8d6dfb839bca42cebe9cd58e3ea97befae --- /dev/null +++ b/params_shard_139.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efe23880be7af131d89882a21a29ad642cf8ff907a5e3985d21eea9ce0ef0550 +size 75497472 diff --git a/params_shard_14.bin b/params_shard_14.bin new file mode 100644 index 0000000000000000000000000000000000000000..8bb98d6dfcf1197f2dcc56b3e6306796b5839948 --- /dev/null +++ b/params_shard_14.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f2e0c1e5d2ca39c869f0501a7335c631b62cce77722bf17f7ecb8cc7950b6e0 +size 100663296 diff --git a/params_shard_140.bin b/params_shard_140.bin new file mode 100644 index 0000000000000000000000000000000000000000..a8b09b3b37442eeb57bd9d067aadb9af89fb58a1 --- /dev/null +++ b/params_shard_140.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fae1dc9d48b15b1f12105a96e45fa4cf9d5458112b5e0714f7b082a600f1c4ae +size 100663296 diff --git a/params_shard_141.bin b/params_shard_141.bin new file mode 100644 index 0000000000000000000000000000000000000000..6760e1a6d7790a7e1b910a8b178adfb90b0f6cdc --- /dev/null +++ b/params_shard_141.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4eaf53917a0e26908665a6792a01d9d323c4e7bd89e33f5ab70b61fb827b6762 +size 402653184 diff --git a/params_shard_142.bin b/params_shard_142.bin new file mode 100644 index 0000000000000000000000000000000000000000..608fbc95a278efc69bdc45c165574ff63d6797ad --- /dev/null +++ b/params_shard_142.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:deb3d012d1205335ba503c97aa13a613e3eedfa57e5a31335514255c50130cf5 +size 201326592 diff --git a/params_shard_143.bin b/params_shard_143.bin new file mode 100644 index 0000000000000000000000000000000000000000..f7a1c6b78983468006425cce85e608f611bc5fe3 --- /dev/null +++ b/params_shard_143.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:239102bdddb5372327a7a27b4e9689de792a256f75ee8a7dbcc6fef69b818d5b +size 75497472 diff --git a/params_shard_144.bin b/params_shard_144.bin new file mode 100644 index 0000000000000000000000000000000000000000..236297e33603224b38f223400b972ff3d475080f --- /dev/null +++ b/params_shard_144.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8748f8b4430c5f0ed1b142a124292b1f4c0129eefaea559a431983a52cfff15 +size 100663296 diff --git a/params_shard_145.bin b/params_shard_145.bin new file mode 100644 index 0000000000000000000000000000000000000000..035d267a798a0a2f972840817ac0289664c5d8dd --- /dev/null +++ b/params_shard_145.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06ef9caed3b86a501f9e4fd67e1b027d170b861b20479cec68c56ce9785ed415 +size 402653184 diff --git a/params_shard_146.bin b/params_shard_146.bin new file mode 100644 index 0000000000000000000000000000000000000000..be02005a6998d81ae02fdcfef08a7a3a044ead01 --- /dev/null +++ b/params_shard_146.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:298aa6f09eebe2f0ce40c8dfa79062aca4993b77981dcda665e5744441ad7e76 +size 201326592 diff --git a/params_shard_147.bin b/params_shard_147.bin new file mode 100644 index 0000000000000000000000000000000000000000..34235a580129526ce1c6ab5c1eff49fd40ca5fde --- /dev/null +++ b/params_shard_147.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca0ca0ba263f471ce47d1d0932e2b994b705e87d08442e5590b0e0d59a280f92 +size 75497472 diff --git a/params_shard_148.bin b/params_shard_148.bin new file mode 100644 index 0000000000000000000000000000000000000000..2b5cd2feb9ea06b4c8246870b83902636f002605 --- /dev/null +++ b/params_shard_148.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:073fd3253d26b288e051a46c4bd12ac6e088aecbf0a6ba0c4a269538f94d39ad +size 100663296 diff --git a/params_shard_149.bin b/params_shard_149.bin new file mode 100644 index 0000000000000000000000000000000000000000..19fec4da1b421ed479887e8cd7a778273a59345e --- /dev/null +++ b/params_shard_149.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e186525fa58da40cdad0ac85c6759abfd48204b10a138afbfeb9a749b9b2b712 +size 402653184 diff --git a/params_shard_15.bin b/params_shard_15.bin new file mode 100644 index 0000000000000000000000000000000000000000..12279f7cfd82f0d30f1f0e22ca635823a235f91a --- /dev/null +++ b/params_shard_15.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:094400add5b8f88214f8af8baf8b4e76bfa77823b6534d5695f7bcc2fc157e68 +size 402653184 diff --git a/params_shard_150.bin b/params_shard_150.bin new file mode 100644 index 0000000000000000000000000000000000000000..04f0b696d9a57f866a548f919e206b08c8cc209a --- /dev/null +++ b/params_shard_150.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8be0bf42b225b07e2ab2659b9dd1e61e95961149934506a2deafbb365d3f7e04 +size 201326592 diff --git a/params_shard_151.bin b/params_shard_151.bin new file mode 100644 index 0000000000000000000000000000000000000000..adef43de8b3764648e19f140d0298a2bd9868dab --- /dev/null +++ b/params_shard_151.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e2720dabf8d2862a45d8dd5a518a12af10f08295bdd70d142f7c1fcccf4318f +size 75497472 diff --git a/params_shard_152.bin b/params_shard_152.bin new file mode 100644 index 0000000000000000000000000000000000000000..0ffdf80f69dedd54ab062cd0d30fa78dec56db28 --- /dev/null +++ b/params_shard_152.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9aa563085dc97ec9717b1ed633602e4c1d44bfce33603e3a3b488f7d80bcaa0 +size 100663296 diff --git a/params_shard_153.bin b/params_shard_153.bin new file mode 100644 index 0000000000000000000000000000000000000000..9d201f729f9ec4b789b67c879fdfbc1a96e4f2ee --- /dev/null +++ b/params_shard_153.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f703d19a4d3ea39cde0b93ed8f747a074bff5ad3d6bc788383d3bf87fd8811d +size 402653184 diff --git a/params_shard_154.bin b/params_shard_154.bin new file mode 100644 index 0000000000000000000000000000000000000000..745e15d739fd2ed4473c5a6252d9bdf9764b4491 --- /dev/null +++ b/params_shard_154.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28f7e389a5981a112c9041b51ff5ad85b64077489d8f3702f8c468b3c8614113 +size 201326592 diff --git a/params_shard_155.bin b/params_shard_155.bin new file mode 100644 index 0000000000000000000000000000000000000000..29bf80928f5f5c03077c32b0b2c566c3717c62cb --- /dev/null +++ b/params_shard_155.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4a7169120d2c28a14332ae93152e7b18adcaa4a2728fcd8a5afe874397e67bf +size 75497472 diff --git a/params_shard_156.bin b/params_shard_156.bin new file mode 100644 index 0000000000000000000000000000000000000000..6acbb95f5e08dcf21af9bb6e8d5b5458bc0e8a3f --- /dev/null +++ b/params_shard_156.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a058f3594a578b9e945723cfcd55e18370eaaf0cff8fd50b17d0a03a91bc854 +size 100663296 diff --git a/params_shard_157.bin b/params_shard_157.bin new file mode 100644 index 0000000000000000000000000000000000000000..14f41fb17279d4801b0a2b5763615d93c1277c0e --- /dev/null +++ b/params_shard_157.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8804267d6ad79d7a02ab2494b35f45bdcfc476724ebf4136f9f8ab8b3876b0e +size 402653184 diff --git a/params_shard_158.bin b/params_shard_158.bin new file mode 100644 index 0000000000000000000000000000000000000000..e13321617d2508e1690e2b0cbb41d5971915a7ad --- /dev/null +++ b/params_shard_158.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:598d40e101fad03eef825c269962dd7dca65c1aed2efffed42f6ddb4cbe7414d +size 201326592 diff --git a/params_shard_159.bin b/params_shard_159.bin new file mode 100644 index 0000000000000000000000000000000000000000..2bed41ad3f7cb8de7f4d665e1f32e1c61243cf8e --- /dev/null +++ b/params_shard_159.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:756eacdaf283f8ce5ba58615fcf37b658b12cef5cb7750f86db1ce9bd5427672 +size 75497472 diff --git a/params_shard_16.bin b/params_shard_16.bin new file mode 100644 index 0000000000000000000000000000000000000000..a35edb5483a2cffeb7bbaf73acaced5385563043 --- /dev/null +++ b/params_shard_16.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac1c73a3c2598792d9bb352bd0222991dd32ab4dc797821595a6ef1170495f3c +size 75497472 diff --git a/params_shard_160.bin b/params_shard_160.bin new file mode 100644 index 0000000000000000000000000000000000000000..a4ba218ef94a4ac23d6484440feaff299124fc91 --- /dev/null +++ b/params_shard_160.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7347f8451b1d6c22a76e0922ec35d42d02115072037f21afc03f3a943fe6c302 +size 100663296 diff --git a/params_shard_161.bin b/params_shard_161.bin new file mode 100644 index 0000000000000000000000000000000000000000..fec606003fedad419ee5c4cd33b8bd45e024bccb --- /dev/null +++ b/params_shard_161.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1593f740d5f978f19840b128c6774f20b73a2aac7b0249b852c50b6b07393649 +size 402653184 diff --git a/params_shard_162.bin b/params_shard_162.bin new file mode 100644 index 0000000000000000000000000000000000000000..92f393d05ddcc29c5d8760a47ead1c28fcf16288 --- /dev/null +++ b/params_shard_162.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef76bce0b9a6a093d3f5fcd4e436dfd08587d07ea88260c7ddce4d7cafc513d4 +size 201326592 diff --git a/params_shard_163.bin b/params_shard_163.bin new file mode 100644 index 0000000000000000000000000000000000000000..53b53d2f59a492402017c6d009bebc42ad774f98 --- /dev/null +++ b/params_shard_163.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ebf8fb6f655085f685eb8b7de7f0ee1f3c92f4a1a017268ce312a16f183de68 +size 75497472 diff --git a/params_shard_164.bin b/params_shard_164.bin new file mode 100644 index 0000000000000000000000000000000000000000..1c8ec697a8225ed3c88cb98ffadf61c04a2c718e --- /dev/null +++ b/params_shard_164.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f9a646ff25f9d3b22fb1378af2adb53e628da6c82d4c5f415d160892f6b5dde +size 100663296 diff --git a/params_shard_165.bin b/params_shard_165.bin new file mode 100644 index 0000000000000000000000000000000000000000..3c43db6f5ce7e0bc6d0fca1700c4d08d4b2804e0 --- /dev/null +++ b/params_shard_165.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4a0dc9c689adb6f0eba34aa9383bba07bce52bc69dbe705c109b054a619edb8 +size 402653184 diff --git a/params_shard_166.bin b/params_shard_166.bin new file mode 100644 index 0000000000000000000000000000000000000000..797b60c937f21b24d652d0390b3f52718b9d7f47 --- /dev/null +++ b/params_shard_166.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d12cf4527329907bc13b433b985b2ed0ac979594573f4dd2cc58037a67cec98f +size 201326592 diff --git a/params_shard_167.bin b/params_shard_167.bin new file mode 100644 index 0000000000000000000000000000000000000000..f83fa19d3c8aaaaea123feecbaacd6974a31477e --- /dev/null +++ b/params_shard_167.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c182dc6f3aaaf73b4c989ef610010287944b241f96c6a5690cc0819ca518d93a +size 75497472 diff --git a/params_shard_168.bin b/params_shard_168.bin new file mode 100644 index 0000000000000000000000000000000000000000..6634d80a8f8af158ebfd73d9f2c1644cf68ddee7 --- /dev/null +++ b/params_shard_168.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4743c013fe11661a4b7b0bc7cab04cfb1861d5b6010f003b5c2a6bc893d0242d +size 100663296 diff --git a/params_shard_169.bin b/params_shard_169.bin new file mode 100644 index 0000000000000000000000000000000000000000..134d6ea38c4566bea0760d34a7d112f44c030cc8 --- /dev/null +++ b/params_shard_169.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6970048a9579f544c3658b02ac1e5890424ee9f504f9a52b2227372de1787a27 +size 402653184 diff --git a/params_shard_17.bin b/params_shard_17.bin new file mode 100644 index 0000000000000000000000000000000000000000..e4ab26ed1bfc970c27a62c75bb8f61a44ad3dddf --- /dev/null +++ b/params_shard_17.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ed38812356447bdeb9ef9cfae9d9f679e478cca9f26e48c527c6c2db0c3e4e3 +size 100663296 diff --git a/params_shard_170.bin b/params_shard_170.bin new file mode 100644 index 0000000000000000000000000000000000000000..c17ab4d99f6b84b12f0cfe3cdeb9e518019d6a06 --- /dev/null +++ b/params_shard_170.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f87d966cf40b1abab2b2016f746377aff0de5faf93ea08a06671264e14a5337 +size 201326592 diff --git a/params_shard_171.bin b/params_shard_171.bin new file mode 100644 index 0000000000000000000000000000000000000000..ef198965f24674ac317bb08bae59c2403469c856 --- /dev/null +++ b/params_shard_171.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:506f0a997a624306d85d83aaae4d5f07fdfef47169999ca86b72e1e7dc681efd +size 75497472 diff --git a/params_shard_172.bin b/params_shard_172.bin new file mode 100644 index 0000000000000000000000000000000000000000..f93f4ea1633056cd4733fd33f8189310c39d8fef --- /dev/null +++ b/params_shard_172.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34e88d77193b4be85795d8106933d484d50ffcc792cfaedbd74a50c25ec1a0a9 +size 100663296 diff --git a/params_shard_173.bin b/params_shard_173.bin new file mode 100644 index 0000000000000000000000000000000000000000..29acdf71bc60e6869e3b0436d8e97a76ae7423a4 --- /dev/null +++ b/params_shard_173.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e05209e6f169bb15eb6b1bc9b63a9c41a8240dc9f8053f9199e7fc1506fa6c4 +size 402653184 diff --git a/params_shard_174.bin b/params_shard_174.bin new file mode 100644 index 0000000000000000000000000000000000000000..32a60a64aeb69ae5eddd420506a2bfb0fbe0443c --- /dev/null +++ b/params_shard_174.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc16c5ef09e35a72d5c2b3c714ca6009a8a2b6a36735bc1e1acc2a3bbee56c64 +size 201326592 diff --git a/params_shard_175.bin b/params_shard_175.bin new file mode 100644 index 0000000000000000000000000000000000000000..c3503836fd425b54fbda800cbdbd9067bc694c40 --- /dev/null +++ b/params_shard_175.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84c36f1085aa595a56befe94ac71b59d7d30fcc436d51293b093a14560146b35 +size 75497472 diff --git a/params_shard_176.bin b/params_shard_176.bin new file mode 100644 index 0000000000000000000000000000000000000000..6061431b1fe835d663e2cb30961f0a3a4dbb78fe --- /dev/null +++ b/params_shard_176.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f141b0894b28ea032c6e2fb7e470bfe9c1cad37896f2460a510f267eb3ea2b9c +size 100663296 diff --git a/params_shard_177.bin b/params_shard_177.bin new file mode 100644 index 0000000000000000000000000000000000000000..c01e1616c18e7e586f369129f10da5eb153e5268 --- /dev/null +++ b/params_shard_177.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6819e259833750406068461e8b6b7464a0c70d801e99dd437d65c413a2847373 +size 402653184 diff --git a/params_shard_178.bin b/params_shard_178.bin new file mode 100644 index 0000000000000000000000000000000000000000..e2f09d2ca998fd03c938a64740829138ef59a79f --- /dev/null +++ b/params_shard_178.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45d71ed6c1417d77574e63f3692c68ff8b4f3e34675f050fbf2eb65cd804f464 +size 201326592 diff --git a/params_shard_179.bin b/params_shard_179.bin new file mode 100644 index 0000000000000000000000000000000000000000..d747413ed882116c3e931263a76d0ec5d7cb6bdd --- /dev/null +++ b/params_shard_179.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f4b21ff911759006f831f2082d5eb3148fba527bbef92354f24ad3734b8d246 +size 75497472 diff --git a/params_shard_18.bin b/params_shard_18.bin new file mode 100644 index 0000000000000000000000000000000000000000..a7a507c7e87963e07c895a77322158923a18e378 --- /dev/null +++ b/params_shard_18.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e904d3472e81ee950201ce26a1dbdd1c670735a2997ba4f574260ecc3576f69 +size 402653184 diff --git a/params_shard_180.bin b/params_shard_180.bin new file mode 100644 index 0000000000000000000000000000000000000000..94db0e77d2bf2cc09011b3000b5bc9d67df55ec4 --- /dev/null +++ b/params_shard_180.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff1598dede75627ade2c15ca87289cc27da560405abbcf785d3724202c563bec +size 100663296 diff --git a/params_shard_181.bin b/params_shard_181.bin new file mode 100644 index 0000000000000000000000000000000000000000..1e74a837332f9bb004f5a09b9eb022d069666f05 --- /dev/null +++ b/params_shard_181.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ca6846fac842167e44ec6818ac818095193f88f577ad14223972697c1058df0 +size 402653184 diff --git a/params_shard_182.bin b/params_shard_182.bin new file mode 100644 index 0000000000000000000000000000000000000000..e745903675ffdf302d80457969bb12cca3977080 --- /dev/null +++ b/params_shard_182.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c5dfb9549b631212ef90ff622fb87c6f98e5b39f176883382c1d8775fefa08e +size 201326592 diff --git a/params_shard_183.bin b/params_shard_183.bin new file mode 100644 index 0000000000000000000000000000000000000000..28dcf92722fb2e77f3a4a1089504ac6e6dfaee06 --- /dev/null +++ b/params_shard_183.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4eb194bacc7b7f67c9b4e0e2f6388e2c011aff57f3c1910d01f2eb9887aa8f7b +size 75497472 diff --git a/params_shard_184.bin b/params_shard_184.bin new file mode 100644 index 0000000000000000000000000000000000000000..4c0319884936ee330f3b68eda42d8ccd5f25ddee --- /dev/null +++ b/params_shard_184.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce087097bdd2814acd7423a0fcfcdaaa9d1bceec28c5d934d41a2f4b281abc19 +size 100663296 diff --git a/params_shard_185.bin b/params_shard_185.bin new file mode 100644 index 0000000000000000000000000000000000000000..fbd5bb1a952882f0588474ec6bdc8d2aaa4c5fd2 --- /dev/null +++ b/params_shard_185.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1459fe4b955110f45bb7790211ef7682ba8cfabd672620215b9b91d693453daf +size 402653184 diff --git a/params_shard_186.bin b/params_shard_186.bin new file mode 100644 index 0000000000000000000000000000000000000000..5d251b853648c3f1b6b32110f88563248e647bd5 --- /dev/null +++ b/params_shard_186.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6857510a811f1bef386db3f6c122a56195c0a39318fd5323b01969e958c56c46 +size 201326592 diff --git a/params_shard_187.bin b/params_shard_187.bin new file mode 100644 index 0000000000000000000000000000000000000000..bda7211ea24bea8f286660f417ca44e059fab2ea --- /dev/null +++ b/params_shard_187.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32c6c31b8d390fe175d5165cb997d08b8e6aa6123f0e69ae4186d331b0ab0d1d +size 75497472 diff --git a/params_shard_188.bin b/params_shard_188.bin new file mode 100644 index 0000000000000000000000000000000000000000..0a1a951fca3356552d5c3db06cad3394ede2817c --- /dev/null +++ b/params_shard_188.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:946a39abf8aa18d20230c835c228ee76035b43e4ca06e58b06affe8c10849801 +size 100663296 diff --git a/params_shard_189.bin b/params_shard_189.bin new file mode 100644 index 0000000000000000000000000000000000000000..9edf8c89d71edb9f5d84f26e48c86faaddd44bfc --- /dev/null +++ b/params_shard_189.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ccbb9b4200c3a591b4c96649181148aa6ce278c2d0d84689003d102acdfb387 +size 402653184 diff --git a/params_shard_19.bin b/params_shard_19.bin new file mode 100644 index 0000000000000000000000000000000000000000..aba09fcb01361f9b4465ff9689d0e26c78a8014c --- /dev/null +++ b/params_shard_19.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da956d3aba7caf05ad0fa84540aefcae7ac22ccb95fa67fc1ae8e46358e8cae9 +size 201326592 diff --git a/params_shard_190.bin b/params_shard_190.bin new file mode 100644 index 0000000000000000000000000000000000000000..0ed0d5bad67a6ec01d34b56180b92463ebada059 --- /dev/null +++ b/params_shard_190.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f69c2194a8e619046d00892b826e33584ddd39f2b0640f3b38ea439ba9856a1 +size 201326592 diff --git a/params_shard_191.bin b/params_shard_191.bin new file mode 100644 index 0000000000000000000000000000000000000000..3c7ff59c84e37078d03407ece81f86f744796c55 --- /dev/null +++ b/params_shard_191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb1f2c2763d65c33adb09b5a2bf351d9f099711348f822c19880116a991f601d +size 75497472 diff --git a/params_shard_192.bin b/params_shard_192.bin new file mode 100644 index 0000000000000000000000000000000000000000..18e7be0a0fdd79a768f392ec4a5318170c7707d5 --- /dev/null +++ b/params_shard_192.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fb4c8ee6360482e503c2285b0c80c81a15a59001967b2536552a8f6a4a37fb5 +size 100663296 diff --git a/params_shard_193.bin b/params_shard_193.bin new file mode 100644 index 0000000000000000000000000000000000000000..6bfc2dfd810ac615b663a800af86f8083a823f65 --- /dev/null +++ b/params_shard_193.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f4df254c57c36aa23c1405ac543ba464039e0f6972cf835aee00277ec6a96ec +size 1137180672 diff --git a/params_shard_194.bin b/params_shard_194.bin new file mode 100644 index 0000000000000000000000000000000000000000..1dcc46964a22c04535e9d29e8a3a3ff06bf98e7d --- /dev/null +++ b/params_shard_194.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b0b9d7fd5941cd56a29bcb83c51d84a1f0a4eceac49318806b4944439db2a80 +size 1191936 diff --git a/params_shard_2.bin b/params_shard_2.bin new file mode 100644 index 0000000000000000000000000000000000000000..9a0342b347a93c9add28e35dbdd528d5eae3a533 --- /dev/null +++ b/params_shard_2.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25ee8bdf26d9f66c1908d47a3863fa11d190beea44a5b3aca7d63c7bec634688 +size 402653184 diff --git a/params_shard_20.bin b/params_shard_20.bin new file mode 100644 index 0000000000000000000000000000000000000000..77ac6d4140cad8c84bd9412b47a1bc1d8796df06 --- /dev/null +++ b/params_shard_20.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55f0b316878c8109dca6b7b66b41ca1c66b96964da500e9b488ddf814a38c519 +size 201326592 diff --git a/params_shard_21.bin b/params_shard_21.bin new file mode 100644 index 0000000000000000000000000000000000000000..ed55c401188e300b179db521f16b17b21b78362b --- /dev/null +++ b/params_shard_21.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56b38020de882e0cafafd0cdd319f9024e61ce0ab4de12511b7a6635bd7a37d9 +size 402653184 diff --git a/params_shard_22.bin b/params_shard_22.bin new file mode 100644 index 0000000000000000000000000000000000000000..437a60058b79760e461111f476ee69cd18246e30 --- /dev/null +++ b/params_shard_22.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f04024c976274dc5dcf7016daa7038d1372605e035a99497c641629b1761d5b6 +size 75497472 diff --git a/params_shard_23.bin b/params_shard_23.bin new file mode 100644 index 0000000000000000000000000000000000000000..3962155cb0409becce021cefb7404fc38458bd6a --- /dev/null +++ b/params_shard_23.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:455efee261092231fb192db96f8f8574457988f836374000be00512c0922a8b7 +size 100663296 diff --git a/params_shard_24.bin b/params_shard_24.bin new file mode 100644 index 0000000000000000000000000000000000000000..a081437ba3887e5058abe28d33778875ec7e1e83 --- /dev/null +++ b/params_shard_24.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6056d04ebf962bf5529f586aae54885bbaedd06fbaa8972793098bb6b763520f +size 402653184 diff --git a/params_shard_25.bin b/params_shard_25.bin new file mode 100644 index 0000000000000000000000000000000000000000..893e5364243b9db293caad99f414d57a6e7c8a3e --- /dev/null +++ b/params_shard_25.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16f45bc97be965aab29ef8b72cddf2b10a2ff843051b4de7c73b134e6c4f596a +size 201326592 diff --git a/params_shard_26.bin b/params_shard_26.bin new file mode 100644 index 0000000000000000000000000000000000000000..252810c8eab67119fdcd29fd7673ba8e03aa1a07 --- /dev/null +++ b/params_shard_26.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78e60a95155accd5ff26434dfe0a1564ae410d8b6e534590d9456ea69aca7ed0 +size 75497472 diff --git a/params_shard_27.bin b/params_shard_27.bin new file mode 100644 index 0000000000000000000000000000000000000000..41e1cf2e827570f46fedaf4667145d2348dbf5dc --- /dev/null +++ b/params_shard_27.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29145b267c857413e86864ff2f0191f3acc31ffc6b18ce147c675d3283f5ff63 +size 100663296 diff --git a/params_shard_28.bin b/params_shard_28.bin new file mode 100644 index 0000000000000000000000000000000000000000..613ae31ed13a32017a0d3339e26e3f17195c2cf6 --- /dev/null +++ b/params_shard_28.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d112e493a1a1a9ff4718469a772083d5a37e72648f8493179a6d433017702caf +size 402653184 diff --git a/params_shard_29.bin b/params_shard_29.bin new file mode 100644 index 0000000000000000000000000000000000000000..9382a1acc23203e8dcd4fe70cd17ea155545ac45 --- /dev/null +++ b/params_shard_29.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e7e49935e81501c915a51572c58337452f41f230f12b161b6333f8d3e315847 +size 201326592 diff --git a/params_shard_3.bin b/params_shard_3.bin new file mode 100644 index 0000000000000000000000000000000000000000..82d8d04fcc909e905f10e62503d25fac4cf3e01e --- /dev/null +++ b/params_shard_3.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c0376eea46edf15494ef68b3e224c38e0c5cf455884f0499ef2057f6dfeda25 +size 201326592 diff --git a/params_shard_30.bin b/params_shard_30.bin new file mode 100644 index 0000000000000000000000000000000000000000..12b6b9e7454972df13bae06724dd51065ab7ea51 --- /dev/null +++ b/params_shard_30.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49749b454e8dda288a9aab531c1f3eeceda7dc764da3a390b89f1a44c8aa93b9 +size 75497472 diff --git a/params_shard_31.bin b/params_shard_31.bin new file mode 100644 index 0000000000000000000000000000000000000000..6c8955cf2a60d96c3561919a476880afa2283ac4 --- /dev/null +++ b/params_shard_31.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f16a3a4a8c2ea7744cf37bc96d0ccbacfc15a662e2ffb4ecff36afc51c8c72ec +size 100663296 diff --git a/params_shard_32.bin b/params_shard_32.bin new file mode 100644 index 0000000000000000000000000000000000000000..e24afe3760ba3ffd93ecbdf33f734776463d7402 --- /dev/null +++ b/params_shard_32.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cf1e051abad1fdfb3782ad4eeb911ba6e85119ce8c85bf49e0ac4f3f1e261ca +size 402653184 diff --git a/params_shard_33.bin b/params_shard_33.bin new file mode 100644 index 0000000000000000000000000000000000000000..5f7a000e25dd06621c1ab6277ebf756a64c0c19b --- /dev/null +++ b/params_shard_33.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5480b90d504115727f43feaff7adc1dc74a810f3645706199ad16c4b7ed8e660 +size 201326592 diff --git a/params_shard_34.bin b/params_shard_34.bin new file mode 100644 index 0000000000000000000000000000000000000000..388bfcae87dc1f934e395505d803a578f53a1a7e --- /dev/null +++ b/params_shard_34.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0befbe8ce0c0a28199e0678a397bcba3a196729bbadc5c8c62d2d86dc325a073 +size 75497472 diff --git a/params_shard_35.bin b/params_shard_35.bin new file mode 100644 index 0000000000000000000000000000000000000000..5b6eeaa8dd9f7cef17fe7e6f1ea94bc23d5dbcff --- /dev/null +++ b/params_shard_35.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bc2c724cd3f7b59e4cfdacbdfcb481266131b08e225e7878c6d1da87461e5cb +size 100663296 diff --git a/params_shard_36.bin b/params_shard_36.bin new file mode 100644 index 0000000000000000000000000000000000000000..60eb89a6d803b972a4af71e8ec6f83f462c9ad08 --- /dev/null +++ b/params_shard_36.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29f10bbe87daf91b7c4fc33762a7ab6862df37863d21fadfe4fed71d2638055c +size 402653184 diff --git a/params_shard_37.bin b/params_shard_37.bin new file mode 100644 index 0000000000000000000000000000000000000000..2e95bee3d8075c8838308f60aba85c6cecdf889c --- /dev/null +++ b/params_shard_37.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c468c3a6226b2a05a4ae8a894b06857068b00b8afab21bbba0e069c885da8da +size 201326592 diff --git a/params_shard_38.bin b/params_shard_38.bin new file mode 100644 index 0000000000000000000000000000000000000000..d6a6514e719b52c774c8fff6fb4e29bb70b83a23 --- /dev/null +++ b/params_shard_38.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a2c780d54b4b270b88e1a847a301399da397679fe9b10901810dff25ea6d975 +size 75497472 diff --git a/params_shard_39.bin b/params_shard_39.bin new file mode 100644 index 0000000000000000000000000000000000000000..b4b04da410edafbc7ab3e54e74dc54f758243e19 --- /dev/null +++ b/params_shard_39.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb591d89973685df0d7f25349b7f08233c17127c59a8f638472a174481877246 +size 100663296 diff --git a/params_shard_4.bin b/params_shard_4.bin new file mode 100644 index 0000000000000000000000000000000000000000..ff553a5dc0bafe00238581f3a500514db0e22c94 --- /dev/null +++ b/params_shard_4.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:044185e88684fcd5785d3d9f5471ba63f30fcc4afe261de02da8d72ec3af03ff +size 1137180672 diff --git a/params_shard_40.bin b/params_shard_40.bin new file mode 100644 index 0000000000000000000000000000000000000000..d4815d676cbc020bd74a76cdf59b853d2904d376 --- /dev/null +++ b/params_shard_40.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3feda6df3f99003dd1a7686733c1164958392c2bc187b34c253a46beade57e0a +size 402653184 diff --git a/params_shard_41.bin b/params_shard_41.bin new file mode 100644 index 0000000000000000000000000000000000000000..5bc586350d82a7f2a734f4d22e4fab6cd239c96e --- /dev/null +++ b/params_shard_41.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d89970a5f5c0734bd7b6406042bf05ed39ef6010caa9c2fa51b0152d92337a2 +size 201326592 diff --git a/params_shard_42.bin b/params_shard_42.bin new file mode 100644 index 0000000000000000000000000000000000000000..4d0f238f687aa553641aa1154116d61dc983fb69 --- /dev/null +++ b/params_shard_42.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03d065ec7318c510aafbe095d780ab2d9dac99c85a8cc3d66fa913a3c007ded5 +size 75497472 diff --git a/params_shard_43.bin b/params_shard_43.bin new file mode 100644 index 0000000000000000000000000000000000000000..d0f0bc922ffa7a7349ba9fd639bbe43facfa5426 --- /dev/null +++ b/params_shard_43.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6aefff7e7b74ca685de9fc0771df66a6794a3df323537dd6d39337d046600ee5 +size 100663296 diff --git a/params_shard_44.bin b/params_shard_44.bin new file mode 100644 index 0000000000000000000000000000000000000000..58f0ccaa5b083f5a9d9fdf6d7eefd7e2e29975e7 --- /dev/null +++ b/params_shard_44.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:713e646e6d5d25046bc9dc9776f0e69b5667436bd858ae3dad64267f8b7a8e31 +size 402653184 diff --git a/params_shard_45.bin b/params_shard_45.bin new file mode 100644 index 0000000000000000000000000000000000000000..c31ca8e53e180823831306b9865b98e2cd44e090 --- /dev/null +++ b/params_shard_45.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca50da09757d4d64b545a8441efd42b49e842712684a752af1165f94eaf86455 +size 201326592 diff --git a/params_shard_46.bin b/params_shard_46.bin new file mode 100644 index 0000000000000000000000000000000000000000..77feb68c55d9201bf744fce8ac871952c2740f92 --- /dev/null +++ b/params_shard_46.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:116f3a277ccfb08e0f8f930841a2af3ada75c9afb61bbbf6f7e1ffb5360c9060 +size 75497472 diff --git a/params_shard_47.bin b/params_shard_47.bin new file mode 100644 index 0000000000000000000000000000000000000000..b3646b7b00c613093a913a3c32b6cad146648573 --- /dev/null +++ b/params_shard_47.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc76a3eebee43ba7021fd475e39e11d88c3db030d6f34290fffec742122954df +size 100663296 diff --git a/params_shard_48.bin b/params_shard_48.bin new file mode 100644 index 0000000000000000000000000000000000000000..d0385d1f8b1757fa5d3138091e88fe7387c46e48 --- /dev/null +++ b/params_shard_48.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cbb1d7aecd064ae97effabf9cbb921e148a97f3dd691bfd2857790015ca930d +size 402653184 diff --git a/params_shard_49.bin b/params_shard_49.bin new file mode 100644 index 0000000000000000000000000000000000000000..a717cb07a6d7b4a6cef34fc8533c6aa7dfd6bd7d --- /dev/null +++ b/params_shard_49.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80fe3b798207bf013c59e03568708d96c62a2fc68a6307eb4d41e40c15fd2a86 +size 201326592 diff --git a/params_shard_5.bin b/params_shard_5.bin new file mode 100644 index 0000000000000000000000000000000000000000..1dca31426c005119f792b45791ddfe6fedddca9f --- /dev/null +++ b/params_shard_5.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfe812d15367e5ea4f55e0ec1996de549ff638648434eeb8faeaf8610fa3ec19 +size 75497472 diff --git a/params_shard_50.bin b/params_shard_50.bin new file mode 100644 index 0000000000000000000000000000000000000000..58b42da9cfe2dca431fecc3f233fd08bec3af748 --- /dev/null +++ b/params_shard_50.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5416d0536268fe86d1a833abf13a3bd9a9f32a36b2669cc9a11fd74302604a3c +size 75497472 diff --git a/params_shard_51.bin b/params_shard_51.bin new file mode 100644 index 0000000000000000000000000000000000000000..cec29a8bf0d9f5b9f600946ab43e9b8843af63f0 --- /dev/null +++ b/params_shard_51.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f011b753ddc47a3e0d35338e05d4525b0dcbdfc6016bcc9cd8496ab197da2950 +size 100663296 diff --git a/params_shard_52.bin b/params_shard_52.bin new file mode 100644 index 0000000000000000000000000000000000000000..a8d06de98e9eb2b783baabe36475534f2a346d72 --- /dev/null +++ b/params_shard_52.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a15828ff1ddc73840dc4777394a1c668800bbd1f70c2673a9b7af268cf77f440 +size 402653184 diff --git a/params_shard_53.bin b/params_shard_53.bin new file mode 100644 index 0000000000000000000000000000000000000000..88498b011df017ef56ab680ef66b923463a91744 --- /dev/null +++ b/params_shard_53.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31e32deb7ff1ca6bbab4a6695155730d6f8a30530f5af550f0744b85f18632fd +size 201326592 diff --git a/params_shard_54.bin b/params_shard_54.bin new file mode 100644 index 0000000000000000000000000000000000000000..0795911806c34309398ac65b172cc7aecc0c2fea --- /dev/null +++ b/params_shard_54.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09465ca9f41773b5671c262862a96dd7a0090df1130bba53eef7c044fc777da5 +size 75497472 diff --git a/params_shard_55.bin b/params_shard_55.bin new file mode 100644 index 0000000000000000000000000000000000000000..3726a0b6471203b05da161254811be71d4ffcfa9 --- /dev/null +++ b/params_shard_55.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29079c1b7585ddebba1f7ab0940944edf0c05f9c7e00f3519100a043f1975dc5 +size 100663296 diff --git a/params_shard_56.bin b/params_shard_56.bin new file mode 100644 index 0000000000000000000000000000000000000000..4e19ed6d12974e00223e1731ff201e2a3bc27530 --- /dev/null +++ b/params_shard_56.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6a9cc68d30f07580fcb765833dae387f551cc9ef51ef425813d13232dec607e +size 402653184 diff --git a/params_shard_57.bin b/params_shard_57.bin new file mode 100644 index 0000000000000000000000000000000000000000..8dc4da78ea940c141c641701583b29780f36a041 --- /dev/null +++ b/params_shard_57.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5302219f1a14c199a0e5cc184a7f65be4ffdb3e8946a1b4997c5a50bbc328466 +size 201326592 diff --git a/params_shard_58.bin b/params_shard_58.bin new file mode 100644 index 0000000000000000000000000000000000000000..808f0c26130e7a87c95293ec5d4bae597bd0149c --- /dev/null +++ b/params_shard_58.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b283ff3ebdd446b1f5d108f061fc6a6941d28a9ba90572e60f66b6b1f0f91979 +size 75497472 diff --git a/params_shard_59.bin b/params_shard_59.bin new file mode 100644 index 0000000000000000000000000000000000000000..08399979724d36fdfced07b6ad060f5b5bf20db5 --- /dev/null +++ b/params_shard_59.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12c8947f51602a402596c34a9331fd9e993ab2fef24fd5fd7fbab25a72095185 +size 100663296 diff --git a/params_shard_6.bin b/params_shard_6.bin new file mode 100644 index 0000000000000000000000000000000000000000..6c1203dcfac3b372558d508bd4e3ee2c89c09967 --- /dev/null +++ b/params_shard_6.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27d80cd8bc231670ea73cf33902a24a5e996849a682315f928e199dd4832f4d4 +size 100663296 diff --git a/params_shard_60.bin b/params_shard_60.bin new file mode 100644 index 0000000000000000000000000000000000000000..df5720209bfc0fccf2958ae08a7baf0ce418f6cb --- /dev/null +++ b/params_shard_60.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b204dd8be2d1dcad464345b438c90cae01da1ce6b7fb75023c4d39393680827 +size 402653184 diff --git a/params_shard_61.bin b/params_shard_61.bin new file mode 100644 index 0000000000000000000000000000000000000000..09414d77702d6bae47a3ed0a55d4d49c198c8ead --- /dev/null +++ b/params_shard_61.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20027564d5265e7263abae9d004bfd287b3eaa3b06984a3d0a8b9aa1979fa99 +size 201326592 diff --git a/params_shard_62.bin b/params_shard_62.bin new file mode 100644 index 0000000000000000000000000000000000000000..9abf2b5787ef9ab28a469db9178cff8fedd06c59 --- /dev/null +++ b/params_shard_62.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:264e335694fdb8435fe1a053c875326d5ddd6be4732c9b46ad90f49d2e92285e +size 75497472 diff --git a/params_shard_63.bin b/params_shard_63.bin new file mode 100644 index 0000000000000000000000000000000000000000..e1977cc0fb0aa1c407faf0491b8c5d33c93f9cbc --- /dev/null +++ b/params_shard_63.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7901cf57e876d7e2421a58bb327a92cfc416109b20e2fdde2db5551d33f76cae +size 100663296 diff --git a/params_shard_64.bin b/params_shard_64.bin new file mode 100644 index 0000000000000000000000000000000000000000..1cbf575a55d52a6c0c58fba77f53ddcdc295b835 --- /dev/null +++ b/params_shard_64.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b15824e0b3b99694efc8f56b78fabd8a265d210e9abc6d8f9a88ec3a631eee9 +size 402653184 diff --git a/params_shard_65.bin b/params_shard_65.bin new file mode 100644 index 0000000000000000000000000000000000000000..cd53f85a57450aa667883b023f6a18b98fda2eb1 --- /dev/null +++ b/params_shard_65.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf81f0adb6c559b8ab6a2c5e5f6813de622c9c4f53473686a91f83b2dd681cf2 +size 201326592 diff --git a/params_shard_66.bin b/params_shard_66.bin new file mode 100644 index 0000000000000000000000000000000000000000..431dc971a818aed83991d7075aa9d382bbc8a168 --- /dev/null +++ b/params_shard_66.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4286d25a0ad1ef7890241f163a5eed1664972dd7c1fced536a0d5aad63452ed +size 75497472 diff --git a/params_shard_67.bin b/params_shard_67.bin new file mode 100644 index 0000000000000000000000000000000000000000..764b2762c30efc4a662247f87d14b6d29577a9a8 --- /dev/null +++ b/params_shard_67.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb96ce9213212452f726c3e96b3e4a8eb84fa3aa6d0d6877b8f7ea3880daba49 +size 100663296 diff --git a/params_shard_68.bin b/params_shard_68.bin new file mode 100644 index 0000000000000000000000000000000000000000..e02c90969106c351c40b9b054b888df97cd938c1 --- /dev/null +++ b/params_shard_68.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:deba2d3022e9513e209be1b7521f4e568377b0ae18607738bf989e4e7adf3b82 +size 402653184 diff --git a/params_shard_69.bin b/params_shard_69.bin new file mode 100644 index 0000000000000000000000000000000000000000..2c08d7ab1348969686a1c1f22ff2a1886bd5062e --- /dev/null +++ b/params_shard_69.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98edf076465df5abe2546d5a29a8aeaacee8fa4ae0ba74b73e084cd817a42da5 +size 201326592 diff --git a/params_shard_7.bin b/params_shard_7.bin new file mode 100644 index 0000000000000000000000000000000000000000..542680604a92c5300178c4f3bf887eb57c9353d0 --- /dev/null +++ b/params_shard_7.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e5538fdcf6367c115427969fb70821ff932faff624610559d3171d4d6934f9f +size 402653184 diff --git a/params_shard_70.bin b/params_shard_70.bin new file mode 100644 index 0000000000000000000000000000000000000000..923a19b2341c96166119137ab92d4e334e759447 --- /dev/null +++ b/params_shard_70.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f5625f014b87fc841b96929fa30c00a4f2e0a2d8d888f6b1124cfcafe9e24a5 +size 75497472 diff --git a/params_shard_71.bin b/params_shard_71.bin new file mode 100644 index 0000000000000000000000000000000000000000..b0bdf91b40d1c8653f8fe98d828c7a5371a42e9d --- /dev/null +++ b/params_shard_71.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:453506aee2113ae110ff3cd8e87f387aefb8caa17df689a43f35cdc45b212111 +size 100663296 diff --git a/params_shard_72.bin b/params_shard_72.bin new file mode 100644 index 0000000000000000000000000000000000000000..5aacb28f92990ee2e569635ac106856d31e435c2 --- /dev/null +++ b/params_shard_72.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcbac9f2efa6069be5e3e6d0688d7a372219199dee7b92d9dd91747649d814c4 +size 402653184 diff --git a/params_shard_73.bin b/params_shard_73.bin new file mode 100644 index 0000000000000000000000000000000000000000..0efa3b74532e68d7e55ef74ba592929cbddae8c5 --- /dev/null +++ b/params_shard_73.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8146082859f0122066dde2c7db23a4267e7e7635a2c087b81a93e5e8690e7f0 +size 201326592 diff --git a/params_shard_74.bin b/params_shard_74.bin new file mode 100644 index 0000000000000000000000000000000000000000..cc6fafbaa0cded20b894ee313e39347bb83a6d14 --- /dev/null +++ b/params_shard_74.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4efe635671090973d9702da9469b609be1b2aa8bd2f6e6770b1246ad8fc2db19 +size 75497472 diff --git a/params_shard_75.bin b/params_shard_75.bin new file mode 100644 index 0000000000000000000000000000000000000000..672c51c63cf7a5ccb230e0c026bc78bcd2b55038 --- /dev/null +++ b/params_shard_75.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f60bc0c9b04ec372a20ba2a2b19f3799e72bd85fa84789d34924a59348cb6a8 +size 100663296 diff --git a/params_shard_76.bin b/params_shard_76.bin new file mode 100644 index 0000000000000000000000000000000000000000..bd5278c7316ddcd12a443a4a1b6d0317efb963c0 --- /dev/null +++ b/params_shard_76.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f2e07736dafeb322a41d075c9775aeb67204fa07488e1b2026a29ec65ac4b1d +size 402653184 diff --git a/params_shard_77.bin b/params_shard_77.bin new file mode 100644 index 0000000000000000000000000000000000000000..796e29df19627ea77d2b5ceafa693046fb1b57ec --- /dev/null +++ b/params_shard_77.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ae5a085d791f07c122a7140dde4c8106f268285a45b5bcd5a3c4d4a82f0a2b8 +size 201326592 diff --git a/params_shard_78.bin b/params_shard_78.bin new file mode 100644 index 0000000000000000000000000000000000000000..207feab14295f953c8a3a208a64bd30b80583b0c --- /dev/null +++ b/params_shard_78.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:606b6b0c84261c0a4c9193f2bcc8b074503b94612d4be1138c40f328f61c13d7 +size 75497472 diff --git a/params_shard_79.bin b/params_shard_79.bin new file mode 100644 index 0000000000000000000000000000000000000000..ba5314465b7b4e55f8cac138931d766ddbc2a0f5 --- /dev/null +++ b/params_shard_79.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:413dc054cc0c5c8757c57115f7e9d9bf7f81378301f91adea66a9e41c85285dd +size 100663296 diff --git a/params_shard_8.bin b/params_shard_8.bin new file mode 100644 index 0000000000000000000000000000000000000000..149c3abe9cd1ede1d428618d80caee138934109e --- /dev/null +++ b/params_shard_8.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c566043f8e1dc0da67dd2be48a3cec4a99e9284f6299cbb782e781d61f33654 +size 201326592 diff --git a/params_shard_80.bin b/params_shard_80.bin new file mode 100644 index 0000000000000000000000000000000000000000..48c0ec4bd1cf700745f9aa2a37624cacb7808acf --- /dev/null +++ b/params_shard_80.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ca70ea82be11324eb6fdb21cb9797c992a4cf0f2be24389055bbb57067730c3 +size 402653184 diff --git a/params_shard_81.bin b/params_shard_81.bin new file mode 100644 index 0000000000000000000000000000000000000000..0911dc1cee530c1e927219f8e9a1d56d066ef563 --- /dev/null +++ b/params_shard_81.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:206a87974aced41922e4ae042ca5d1960c325cadaf0e90e3bded81832abfe283 +size 201326592 diff --git a/params_shard_82.bin b/params_shard_82.bin new file mode 100644 index 0000000000000000000000000000000000000000..45cf2931ce59f31336e51394f6026984661285a5 --- /dev/null +++ b/params_shard_82.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe81e44bcf689c04df48a8518336a0d6163daed07103059489265b1686460abe +size 75497472 diff --git a/params_shard_83.bin b/params_shard_83.bin new file mode 100644 index 0000000000000000000000000000000000000000..1f22eb25e8149440dfd178719f8c14643868d6b5 --- /dev/null +++ b/params_shard_83.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbc25fe7b3169ef6e817e1bfd9bd563b49478afe5fb8a7a345b1870366a6453e +size 100663296 diff --git a/params_shard_84.bin b/params_shard_84.bin new file mode 100644 index 0000000000000000000000000000000000000000..86dcaae3691dc71618673f75385f7b9848247d5a --- /dev/null +++ b/params_shard_84.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ff4cd52e501b9b904207d6b16cddf0ca67d51b19e5677b4ab32385793e3c867 +size 402653184 diff --git a/params_shard_85.bin b/params_shard_85.bin new file mode 100644 index 0000000000000000000000000000000000000000..3ad0d93e630387d0bfcaba19a9927f42abe2a077 --- /dev/null +++ b/params_shard_85.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6224e5fa4d30a92cd8648c4f8925dac094408f004c6299ff3cc956489103b66a +size 201326592 diff --git a/params_shard_86.bin b/params_shard_86.bin new file mode 100644 index 0000000000000000000000000000000000000000..13867925508130f5adcdb70eed332c587ee0eff7 --- /dev/null +++ b/params_shard_86.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48c0117544468fb22e6905cbe70a7ba469a0a991bd8af3cfc6b9fab5e46547f3 +size 75497472 diff --git a/params_shard_87.bin b/params_shard_87.bin new file mode 100644 index 0000000000000000000000000000000000000000..4e26ee6e5c97788fc807f98d8500e1676242bdbe --- /dev/null +++ b/params_shard_87.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e34759a305f4ac3258db262833d481ff93aea97e8a8f7ed445ac2c227db426fd +size 100663296 diff --git a/params_shard_88.bin b/params_shard_88.bin new file mode 100644 index 0000000000000000000000000000000000000000..e4e52b7d2d43e4759a45fb1a3ba01455494edbba --- /dev/null +++ b/params_shard_88.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:282ce052a037b5c74b2a7175113f391e096d2a7ea25f48e00721ff406bee892e +size 402653184 diff --git a/params_shard_89.bin b/params_shard_89.bin new file mode 100644 index 0000000000000000000000000000000000000000..13eaad7c8188754090d9381ad9ca073c431d38a1 --- /dev/null +++ b/params_shard_89.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:126fa1cc6eb17e8c4974acf20d6815f90eafc7163c8d6472c684fae32c204aa9 +size 201326592 diff --git a/params_shard_9.bin b/params_shard_9.bin new file mode 100644 index 0000000000000000000000000000000000000000..1a6e90adb7748abc67130ce37c57451819cd98db --- /dev/null +++ b/params_shard_9.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52f3bba5df06b092f24f635459224561a4ce7cd00fe0deb13ea724a5f5e97152 +size 75497472 diff --git a/params_shard_90.bin b/params_shard_90.bin new file mode 100644 index 0000000000000000000000000000000000000000..d4c168dbdf13d540f9c867aaac70caf5a195e702 --- /dev/null +++ b/params_shard_90.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc0de287ea213b60d2bdec1e012d19858095527894c245729ff80f93042cce1d +size 75497472 diff --git a/params_shard_91.bin b/params_shard_91.bin new file mode 100644 index 0000000000000000000000000000000000000000..e414245b5ab665bb510690d67ef0d9fce41bb88f --- /dev/null +++ b/params_shard_91.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6b66e40677b95801297ace8a1eec3ed7508845dfbc029e59d0c90acdae63421 +size 100663296 diff --git a/params_shard_92.bin b/params_shard_92.bin new file mode 100644 index 0000000000000000000000000000000000000000..95968543084c5116346b74087ac0ec7571cca9a5 --- /dev/null +++ b/params_shard_92.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:071fec37ee201aec50d69f8cbe4caf1ef7c64b9297e3b8215b1552b64d677869 +size 402653184 diff --git a/params_shard_93.bin b/params_shard_93.bin new file mode 100644 index 0000000000000000000000000000000000000000..5425948a8aa6793e536abe9fa09f7cb2410fe329 --- /dev/null +++ b/params_shard_93.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9fa909d51c84a2537fa6f10b18c603275faf371c54aee34d1b575cc197a3e3b +size 201326592 diff --git a/params_shard_94.bin b/params_shard_94.bin new file mode 100644 index 0000000000000000000000000000000000000000..930105a6778d479e77a3208a6a3f31d3aa753055 --- /dev/null +++ b/params_shard_94.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d674024c8ed35b1f1c6403bd0d77353b1622b104be33cde26c2fe1b48ca83f1 +size 75497472 diff --git a/params_shard_95.bin b/params_shard_95.bin new file mode 100644 index 0000000000000000000000000000000000000000..67ab761a0ceb3bde182085e5d55a221f91a9e0f1 --- /dev/null +++ b/params_shard_95.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de5672da7cde1eb7eaafb4ac703ceed30b0e3d01d0abac1667cff3459a9c780f +size 100663296 diff --git a/params_shard_96.bin b/params_shard_96.bin new file mode 100644 index 0000000000000000000000000000000000000000..0e3322df34f714b02d091fefc5fd6d7971fcb3e3 --- /dev/null +++ b/params_shard_96.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90f3fed64431ce1d45d642b654e49854f1b976a48d8a0b9cc2b71c79e5f255da +size 402653184 diff --git a/params_shard_97.bin b/params_shard_97.bin new file mode 100644 index 0000000000000000000000000000000000000000..07488741f2a78ce624808555259060636f5fcd74 --- /dev/null +++ b/params_shard_97.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:427ca788f16efe8d6c816af600bb04a3720bb491eaacd9d44a1dc61c02d1e63d +size 201326592 diff --git a/params_shard_98.bin b/params_shard_98.bin new file mode 100644 index 0000000000000000000000000000000000000000..4256403272a2f8e338f84d93ed79ad1c9533e54b --- /dev/null +++ b/params_shard_98.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b5a91c774ef96edf197095bf21eedc2f71010bc6276a46037a86a72bcb2f3af +size 75497472 diff --git a/params_shard_99.bin b/params_shard_99.bin new file mode 100644 index 0000000000000000000000000000000000000000..28bca56e4c3d489eec1663cc698291b46d3446eb --- /dev/null +++ b/params_shard_99.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4ad2cc494f5cabf6d415848ec20e90eb7a05ee3c403a3a42c6536c5488ce8b2 +size 100663296