diff --git a/ndarray-cache.json b/ndarray-cache.json new file mode 100644 index 0000000000000000000000000000000000000000..61c4bd5093181bec3a13e17c2f14340028e0ffd6 --- /dev/null +++ b/ndarray-cache.json @@ -0,0 +1,7183 @@ +{ + "metadata": { + "ParamSize": 485, + "ParamBytes": 11172753408.0, + "BitsPerParam": 4.097919499366067 + }, + "records": [ + { + "dataPath": "params_shard_0.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "model.layers.0.attention.wqkv.q_weight", + "shape": [ + 8192, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "b9b9e5d249b538a2a23cd9d6019981ce" + }, + { + "dataPath": "params_shard_1.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.0.feed_forward.gate_up_proj.q_weight", + "shape": [ + 32768, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "b75a004c453f62cb53310dd9f39a4e50" + }, + { + "dataPath": "params_shard_2.bin", + "format": "raw-shard", + "nbytes": 24391680, + "records": [ + { + "name": "model.layers.0.attention.wo.q_weight", + "shape": [ + 6144, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 18874368, + "byteOffset": 0 + }, + { + "name": "model.layers.0.attention.wo.q_scale", + "shape": [ + 6144, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 2359296, + "byteOffset": 18874368 + }, + { + "name": "model.layers.0.attention.wqkv.q_scale", + "shape": [ + 8192, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3145728, + "byteOffset": 21233664 + }, + { + "name": "model.layers.0.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 24379392 + } + ], + "md5sum": "e6520c88c12f921f441acee5398ff07c" + }, + { + "dataPath": "params_shard_3.bin", + "format": "raw-shard", + "nbytes": 50331648, + "records": [ + { + "name": "model.layers.0.feed_forward.w2.q_weight", + "shape": [ + 6144, + 2048 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 50331648, + "byteOffset": 0 + } + ], + "md5sum": "f3ebb9920e8b85c57da98df48847ce9d" + }, + { + "dataPath": "params_shard_4.bin", + "format": "raw-shard", + "nbytes": 284295168, + "records": [ + { + "name": "model.tok_embeddings.q_weight", + "shape": [ + 92544, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 284295168, + "byteOffset": 0 + } + ], + "md5sum": "ca14145a0c0c4c397f63d05d3efc2835" + }, + { + "dataPath": "params_shard_5.bin", + "format": "raw-shard", + "nbytes": 35536896, + "records": [ + { + "name": "model.tok_embeddings.q_scale", + "shape": [ + 92544, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 35536896, + "byteOffset": 0 + } + ], + "md5sum": "0ea7afeba332ab1e5b9532773d69a3b1" + }, + { + "dataPath": "params_shard_6.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "model.layers.1.attention.wo.q_weight", + "shape": [ + 6144, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 18874368, + "byteOffset": 0 + } + ], + "md5sum": "77dfcb6bdbf516add8ecfff6d44965d2" + }, + { + "dataPath": "params_shard_7.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "model.layers.1.attention.wqkv.q_weight", + "shape": [ + 8192, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "4d57d99f602e5e7564264495c55bf3b6" + }, + { + "dataPath": "params_shard_8.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.1.feed_forward.gate_up_proj.q_weight", + "shape": [ + 32768, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "1692de5d18f15e7c01bb91a26dc0230e" + }, + { + "dataPath": "params_shard_9.bin", + "format": "raw-shard", + "nbytes": 24403968, + "records": [ + { + "name": "model.layers.0.feed_forward.gate_up_proj.q_scale", + "shape": [ + 32768, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.0.feed_forward.w2.q_scale", + "shape": [ + 6144, + 512 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 6291456, + "byteOffset": 12582912 + }, + { + "name": "model.layers.0.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 18874368 + }, + { + "name": "model.layers.1.attention.wo.q_scale", + "shape": [ + 6144, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 2359296, + "byteOffset": 18886656 + }, + { + "name": "model.layers.1.attention.wqkv.q_scale", + "shape": [ + 8192, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3145728, + "byteOffset": 21245952 + }, + { + "name": "model.layers.1.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 24391680 + } + ], + "md5sum": "98e4b0820b49d5bccf6fe1dbb8be7ce2" + }, + { + "dataPath": "params_shard_10.bin", + "format": "raw-shard", + "nbytes": 50331648, + "records": [ + { + "name": "model.layers.1.feed_forward.w2.q_weight", + "shape": [ + 6144, + 2048 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 50331648, + "byteOffset": 0 + } + ], + "md5sum": "72a985405bb3d53f60b97bf1e2332e2b" + }, + { + "dataPath": "params_shard_11.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "model.layers.2.attention.wo.q_weight", + "shape": [ + 6144, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 18874368, + "byteOffset": 0 + } + ], + "md5sum": "cf1fa92d5b1a4100c6549a2c884b4983" + }, + { + "dataPath": "params_shard_12.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "model.layers.2.attention.wqkv.q_weight", + "shape": [ + 8192, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "fe5145ac7899a1d1de150d2ebc809cff" + }, + { + "dataPath": "params_shard_13.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.2.feed_forward.gate_up_proj.q_weight", + "shape": [ + 32768, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "2034c0e4cf1503838051c15fed1a11bc" + }, + { + "dataPath": "params_shard_14.bin", + "format": "raw-shard", + "nbytes": 24403968, + "records": [ + { + "name": "model.layers.1.feed_forward.gate_up_proj.q_scale", + "shape": [ + 32768, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.1.feed_forward.w2.q_scale", + "shape": [ + 6144, + 512 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 6291456, + "byteOffset": 12582912 + }, + { + "name": "model.layers.1.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 18874368 + }, + { + "name": "model.layers.2.attention.wo.q_scale", + "shape": [ + 6144, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 2359296, + "byteOffset": 18886656 + }, + { + "name": "model.layers.2.attention.wqkv.q_scale", + "shape": [ + 8192, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3145728, + "byteOffset": 21245952 + }, + { + "name": "model.layers.2.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 24391680 + } + ], + "md5sum": "238d86afda94541e05ffba291879c288" + }, + { + "dataPath": "params_shard_15.bin", + "format": "raw-shard", + "nbytes": 50331648, + "records": [ + { + "name": "model.layers.2.feed_forward.w2.q_weight", + "shape": [ + 6144, + 2048 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 50331648, + "byteOffset": 0 + } + ], + "md5sum": "b038ebb996dcdbcda9e26155429e364f" + }, + { + "dataPath": "params_shard_16.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "model.layers.3.attention.wo.q_weight", + "shape": [ + 6144, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 18874368, + "byteOffset": 0 + } + ], + "md5sum": "e9f17c0201ce0717438d68866358cd96" + }, + { + "dataPath": "params_shard_17.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "model.layers.3.attention.wqkv.q_weight", + "shape": [ + 8192, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "8fbac1aab61a4fc5a7c43923d2318165" + }, + { + "dataPath": "params_shard_18.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.3.feed_forward.gate_up_proj.q_weight", + "shape": [ + 32768, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "0937017c79435c4e9fe98bb3e03f40a6" + }, + { + "dataPath": "params_shard_19.bin", + "format": "raw-shard", + "nbytes": 24391680, + "records": [ + { + "name": "model.layers.2.feed_forward.gate_up_proj.q_scale", + "shape": [ + 32768, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.2.feed_forward.w2.q_scale", + "shape": [ + 6144, + 512 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 6291456, + "byteOffset": 12582912 + }, + { + "name": "model.layers.2.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 18874368 + }, + { + "name": "model.layers.3.attention.wo.q_scale", + "shape": [ + 6144, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 2359296, + "byteOffset": 18886656 + }, + { + "name": "model.layers.3.attention.wqkv.q_scale", + "shape": [ + 8192, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3145728, + "byteOffset": 21245952 + } + ], + "md5sum": "a36f20dc7a6ffe035aa2583d09804c63" + }, + { + "dataPath": "params_shard_20.bin", + "format": "raw-shard", + "nbytes": 31457280, + "records": [ + { + "name": "model.layers.3.feed_forward.gate_up_proj.q_scale", + "shape": [ + 32768, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.10.attention.wo.q_weight", + "shape": [ + 6144, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 18874368, + "byteOffset": 12582912 + } + ], + "md5sum": "2bba0fd99b16bc9c746f856e35ebdd73" + }, + { + "dataPath": "params_shard_21.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.10.feed_forward.gate_up_proj.q_weight", + "shape": [ + 32768, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "0ffab72d9b34516e2118eace3282a859" + }, + { + "dataPath": "params_shard_22.bin", + "format": "raw-shard", + "nbytes": 30683136, + "records": [ + { + "name": "model.layers.10.attention.wo.q_scale", + "shape": [ + 6144, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 2359296, + "byteOffset": 0 + }, + { + "name": "model.layers.10.attention.wqkv.q_weight", + "shape": [ + 8192, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 25165824, + "byteOffset": 2359296 + }, + { + "name": "model.layers.10.attention.wqkv.q_scale", + "shape": [ + 8192, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3145728, + "byteOffset": 27525120 + }, + { + "name": "model.layers.10.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 30670848 + } + ], + "md5sum": "721df0faac45e9bed34d03d5722df4fa" + }, + { + "dataPath": "params_shard_23.bin", + "format": "raw-shard", + "nbytes": 50331648, + "records": [ + { + "name": "model.layers.10.feed_forward.w2.q_weight", + "shape": [ + 6144, + 2048 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 50331648, + "byteOffset": 0 + } + ], + "md5sum": "e06a46bd4ff4616470764256b08ccaa5" + }, + { + "dataPath": "params_shard_24.bin", + "format": "raw-shard", + "nbytes": 50331648, + "records": [ + { + "name": "model.layers.8.feed_forward.w2.q_weight", + "shape": [ + 6144, + 2048 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 50331648, + "byteOffset": 0 + } + ], + "md5sum": "e94c72f18607594bf53fca9f8ab6e9ed" + }, + { + "dataPath": "params_shard_25.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.8.feed_forward.gate_up_proj.q_weight", + "shape": [ + 32768, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "a2b1f939810b4c0898f0503237eafac4" + }, + { + "dataPath": "params_shard_26.bin", + "format": "raw-shard", + "nbytes": 25190400, + "records": [ + { + "name": "model.layers.10.feed_forward.gate_up_proj.q_scale", + "shape": [ + 32768, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.10.feed_forward.w2.q_scale", + "shape": [ + 6144, + 512 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 6291456, + "byteOffset": 12582912 + }, + { + "name": "model.layers.10.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 18874368 + }, + { + "name": "model.layers.8.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 18886656 + }, + { + "name": "model.layers.8.feed_forward.w2.q_scale", + "shape": [ + 6144, + 512 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 6291456, + "byteOffset": 18898944 + } + ], + "md5sum": "c8057dea8cd1821e44c0c9dd91c41d3a" + }, + { + "dataPath": "params_shard_27.bin", + "format": "raw-shard", + "nbytes": 31469568, + "records": [ + { + "name": "model.layers.8.feed_forward.gate_up_proj.q_scale", + "shape": [ + 32768, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.8.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 12582912 + }, + { + "name": "model.layers.9.attention.wo.q_weight", + "shape": [ + 6144, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 18874368, + "byteOffset": 12595200 + } + ], + "md5sum": "1466895e1c5cbc65be0449eae1ba0765" + }, + { + "dataPath": "params_shard_28.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.9.feed_forward.gate_up_proj.q_weight", + "shape": [ + 32768, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "1c148c5952261b2e18fd0a68e1edd1c9" + }, + { + "dataPath": "params_shard_29.bin", + "format": "raw-shard", + "nbytes": 30683136, + "records": [ + { + "name": "model.layers.9.attention.wo.q_scale", + "shape": [ + 6144, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 2359296, + "byteOffset": 0 + }, + { + "name": "model.layers.9.attention.wqkv.q_weight", + "shape": [ + 8192, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 25165824, + "byteOffset": 2359296 + }, + { + "name": "model.layers.9.attention.wqkv.q_scale", + "shape": [ + 8192, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3145728, + "byteOffset": 27525120 + }, + { + "name": "model.layers.9.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 30670848 + } + ], + "md5sum": "2113efd5882d73352a9dca055ccb605f" + }, + { + "dataPath": "params_shard_30.bin", + "format": "raw-shard", + "nbytes": 50331648, + "records": [ + { + "name": "model.layers.9.feed_forward.w2.q_weight", + "shape": [ + 6144, + 2048 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 50331648, + "byteOffset": 0 + } + ], + "md5sum": "b4e775cd3ccdb408b60c073ade853922" + }, + { + "dataPath": "params_shard_31.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "model.layers.11.attention.wo.q_weight", + "shape": [ + 6144, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 18874368, + "byteOffset": 0 + } + ], + "md5sum": "97fac31ac46ddf3359658e56238b008a" + }, + { + "dataPath": "params_shard_32.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "model.layers.11.attention.wqkv.q_weight", + "shape": [ + 8192, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "1b10c5106b6f876782ff41ebcbb8c55e" + }, + { + "dataPath": "params_shard_33.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.11.feed_forward.gate_up_proj.q_weight", + "shape": [ + 32768, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "fd7a2553ea053177b9c55ac60d7fba99" + }, + { + "dataPath": "params_shard_34.bin", + "format": "raw-shard", + "nbytes": 24403968, + "records": [ + { + "name": "model.layers.9.feed_forward.gate_up_proj.q_scale", + "shape": [ + 32768, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.9.feed_forward.w2.q_scale", + "shape": [ + 6144, + 512 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 6291456, + "byteOffset": 12582912 + }, + { + "name": "model.layers.9.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 18874368 + }, + { + "name": "model.layers.11.attention.wo.q_scale", + "shape": [ + 6144, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 2359296, + "byteOffset": 18886656 + }, + { + "name": "model.layers.11.attention.wqkv.q_scale", + "shape": [ + 8192, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3145728, + "byteOffset": 21245952 + }, + { + "name": "model.layers.11.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 24391680 + } + ], + "md5sum": "d7984a5f3fe1753cd27283f9d0159c6b" + }, + { + "dataPath": "params_shard_35.bin", + "format": "raw-shard", + "nbytes": 50331648, + "records": [ + { + "name": "model.layers.11.feed_forward.w2.q_weight", + "shape": [ + 6144, + 2048 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 50331648, + "byteOffset": 0 + } + ], + "md5sum": "02fae08b842e37606de9c803d5488f48" + }, + { + "dataPath": "params_shard_36.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "model.layers.12.attention.wo.q_weight", + "shape": [ + 6144, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 18874368, + "byteOffset": 0 + } + ], + "md5sum": "aa42bea3a653e85154609159e5a73fcf" + }, + { + "dataPath": "params_shard_37.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "model.layers.12.attention.wqkv.q_weight", + "shape": [ + 8192, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "fe075a318e0f8b16a4d2a8368d66413f" + }, + { + "dataPath": "params_shard_38.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.12.feed_forward.gate_up_proj.q_weight", + "shape": [ + 32768, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "45c07eaec64f198398cffa978d9a83f5" + }, + { + "dataPath": "params_shard_39.bin", + "format": "raw-shard", + "nbytes": 24403968, + "records": [ + { + "name": "model.layers.11.feed_forward.gate_up_proj.q_scale", + "shape": [ + 32768, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.11.feed_forward.w2.q_scale", + "shape": [ + 6144, + 512 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 6291456, + "byteOffset": 12582912 + }, + { + "name": "model.layers.11.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 18874368 + }, + { + "name": "model.layers.12.attention.wo.q_scale", + "shape": [ + 6144, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 2359296, + "byteOffset": 18886656 + }, + { + "name": "model.layers.12.attention.wqkv.q_scale", + "shape": [ + 8192, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3145728, + "byteOffset": 21245952 + }, + { + "name": "model.layers.12.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 24391680 + } + ], + "md5sum": "162ac15e1b59aeb7d672ca7ec7fa4f42" + }, + { + "dataPath": "params_shard_40.bin", + "format": "raw-shard", + "nbytes": 50331648, + "records": [ + { + "name": "model.layers.12.feed_forward.w2.q_weight", + "shape": [ + 6144, + 2048 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 50331648, + "byteOffset": 0 + } + ], + "md5sum": "be62d70497cdc602815537e2b6187b40" + }, + { + "dataPath": "params_shard_41.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "model.layers.13.attention.wo.q_weight", + "shape": [ + 6144, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 18874368, + "byteOffset": 0 + } + ], + "md5sum": "3a2b112ed21e5a0b5420a8c62d458bca" + }, + { + "dataPath": "params_shard_42.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "model.layers.13.attention.wqkv.q_weight", + "shape": [ + 8192, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "cd5d417be0799a24a579c9fb626146a7" + }, + { + "dataPath": "params_shard_43.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.13.feed_forward.gate_up_proj.q_weight", + "shape": [ + 32768, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "ee35ec38f8c514405574ed5a4f3c0d1d" + }, + { + "dataPath": "params_shard_44.bin", + "format": "raw-shard", + "nbytes": 24391680, + "records": [ + { + "name": "model.layers.12.feed_forward.gate_up_proj.q_scale", + "shape": [ + 32768, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.12.feed_forward.w2.q_scale", + "shape": [ + 6144, + 512 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 6291456, + "byteOffset": 12582912 + }, + { + "name": "model.layers.12.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 18874368 + }, + { + "name": "model.layers.13.attention.wo.q_scale", + "shape": [ + 6144, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 2359296, + "byteOffset": 18886656 + }, + { + "name": "model.layers.13.attention.wqkv.q_scale", + "shape": [ + 8192, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3145728, + "byteOffset": 21245952 + } + ], + "md5sum": "f24ddbaf32a5d7f5b71c7e5cee8d01e0" + }, + { + "dataPath": "params_shard_45.bin", + "format": "raw-shard", + "nbytes": 50331648, + "records": [ + { + "name": "model.layers.13.feed_forward.w2.q_weight", + "shape": [ + 6144, + 2048 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 50331648, + "byteOffset": 0 + } + ], + "md5sum": "b5aa78602d686a8a798ba8edc5ea12a8" + }, + { + "dataPath": "params_shard_46.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "model.layers.14.attention.wo.q_weight", + "shape": [ + 6144, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 18874368, + "byteOffset": 0 + } + ], + "md5sum": "e70489449fb9987fb1923e5ae5f20f3e" + }, + { + "dataPath": "params_shard_47.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "model.layers.14.attention.wqkv.q_weight", + "shape": [ + 8192, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "2cbdca22297f8fb2492e184b2498c5ef" + }, + { + "dataPath": "params_shard_48.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.14.feed_forward.gate_up_proj.q_weight", + "shape": [ + 32768, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "bf26d2932c39e61d8f16d72d1a1007cb" + }, + { + "dataPath": "params_shard_49.bin", + "format": "raw-shard", + "nbytes": 24416256, + "records": [ + { + "name": "model.layers.13.feed_forward.gate_up_proj.q_scale", + "shape": [ + 32768, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.13.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 12582912 + }, + { + "name": "model.layers.13.feed_forward.w2.q_scale", + "shape": [ + 6144, + 512 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 6291456, + "byteOffset": 12595200 + }, + { + "name": "model.layers.13.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 18886656 + }, + { + "name": "model.layers.14.attention.wo.q_scale", + "shape": [ + 6144, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 2359296, + "byteOffset": 18898944 + }, + { + "name": "model.layers.14.attention.wqkv.q_scale", + "shape": [ + 8192, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3145728, + "byteOffset": 21258240 + }, + { + "name": "model.layers.14.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 24403968 + } + ], + "md5sum": "4c345ead3a6d1626b0fa94d39f760f42" + }, + { + "dataPath": "params_shard_50.bin", + "format": "raw-shard", + "nbytes": 50331648, + "records": [ + { + "name": "model.layers.14.feed_forward.w2.q_weight", + "shape": [ + 6144, + 2048 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 50331648, + "byteOffset": 0 + } + ], + "md5sum": "05ed145f96a749f1e5485007ba9bdff3" + }, + { + "dataPath": "params_shard_51.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "model.layers.15.attention.wo.q_weight", + "shape": [ + 6144, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 18874368, + "byteOffset": 0 + } + ], + "md5sum": "91b196f1ee5b0c9fc7eab50972cfb94d" + }, + { + "dataPath": "params_shard_52.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "model.layers.15.attention.wqkv.q_weight", + "shape": [ + 8192, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "46190f54ec12b2d53e0f4a39ff7606e0" + }, + { + "dataPath": "params_shard_53.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.15.feed_forward.gate_up_proj.q_weight", + "shape": [ + 32768, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "65a10a2088cbe633298f90961d3008c4" + }, + { + "dataPath": "params_shard_54.bin", + "format": "raw-shard", + "nbytes": 24403968, + "records": [ + { + "name": "model.layers.14.feed_forward.gate_up_proj.q_scale", + "shape": [ + 32768, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.14.feed_forward.w2.q_scale", + "shape": [ + 6144, + 512 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 6291456, + "byteOffset": 12582912 + }, + { + "name": "model.layers.14.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 18874368 + }, + { + "name": "model.layers.15.attention.wo.q_scale", + "shape": [ + 6144, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 2359296, + "byteOffset": 18886656 + }, + { + "name": "model.layers.15.attention.wqkv.q_scale", + "shape": [ + 8192, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3145728, + "byteOffset": 21245952 + }, + { + "name": "model.layers.15.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 24391680 + } + ], + "md5sum": "5422bdbf876020a942b0ae48542e997a" + }, + { + "dataPath": "params_shard_55.bin", + "format": "raw-shard", + "nbytes": 50331648, + "records": [ + { + "name": "model.layers.15.feed_forward.w2.q_weight", + "shape": [ + 6144, + 2048 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 50331648, + "byteOffset": 0 + } + ], + "md5sum": "40d406373edcfe671148f51c58188b3d" + }, + { + "dataPath": "params_shard_56.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "model.layers.16.attention.wo.q_weight", + "shape": [ + 6144, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 18874368, + "byteOffset": 0 + } + ], + "md5sum": "f36308450b85047579030599cd4807fe" + }, + { + "dataPath": "params_shard_57.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "model.layers.16.attention.wqkv.q_weight", + "shape": [ + 8192, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "5d54b81a65ed98f8cb420b3ac5c810b3" + }, + { + "dataPath": "params_shard_58.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.16.feed_forward.gate_up_proj.q_weight", + "shape": [ + 32768, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "92128fdd9d2ce3d54b5cf38b9bc28391" + }, + { + "dataPath": "params_shard_59.bin", + "format": "raw-shard", + "nbytes": 24403968, + "records": [ + { + "name": "model.layers.15.feed_forward.gate_up_proj.q_scale", + "shape": [ + 32768, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.15.feed_forward.w2.q_scale", + "shape": [ + 6144, + 512 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 6291456, + "byteOffset": 12582912 + }, + { + "name": "model.layers.15.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 18874368 + }, + { + "name": "model.layers.16.attention.wo.q_scale", + "shape": [ + 6144, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 2359296, + "byteOffset": 18886656 + }, + { + "name": "model.layers.16.attention.wqkv.q_scale", + "shape": [ + 8192, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3145728, + "byteOffset": 21245952 + }, + { + "name": "model.layers.16.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 24391680 + } + ], + "md5sum": "e6888c0a747108846cc9f2eb2cb2c98a" + }, + { + "dataPath": "params_shard_60.bin", + "format": "raw-shard", + "nbytes": 50331648, + "records": [ + { + "name": "model.layers.16.feed_forward.w2.q_weight", + "shape": [ + 6144, + 2048 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 50331648, + "byteOffset": 0 + } + ], + "md5sum": "246725ecc77323925205f98ad2ad48f9" + }, + { + "dataPath": "params_shard_61.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "model.layers.17.attention.wo.q_weight", + "shape": [ + 6144, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 18874368, + "byteOffset": 0 + } + ], + "md5sum": "bf703b923c7bab71f5bf4e4b5f892a76" + }, + { + "dataPath": "params_shard_62.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "model.layers.17.attention.wqkv.q_weight", + "shape": [ + 8192, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "3d97de2553397e1bb18768648aa64868" + }, + { + "dataPath": "params_shard_63.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.17.feed_forward.gate_up_proj.q_weight", + "shape": [ + 32768, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "76dcedeef122b7058d63692923aef750" + }, + { + "dataPath": "params_shard_64.bin", + "format": "raw-shard", + "nbytes": 24403968, + "records": [ + { + "name": "model.layers.16.feed_forward.gate_up_proj.q_scale", + "shape": [ + 32768, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.16.feed_forward.w2.q_scale", + "shape": [ + 6144, + 512 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 6291456, + "byteOffset": 12582912 + }, + { + "name": "model.layers.16.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 18874368 + }, + { + "name": "model.layers.17.attention.wo.q_scale", + "shape": [ + 6144, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 2359296, + "byteOffset": 18886656 + }, + { + "name": "model.layers.17.attention.wqkv.q_scale", + "shape": [ + 8192, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3145728, + "byteOffset": 21245952 + }, + { + "name": "model.layers.17.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 24391680 + } + ], + "md5sum": "47a0c159a9a9a3fb72c2b811faf05d0a" + }, + { + "dataPath": "params_shard_65.bin", + "format": "raw-shard", + "nbytes": 50331648, + "records": [ + { + "name": "model.layers.17.feed_forward.w2.q_weight", + "shape": [ + 6144, + 2048 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 50331648, + "byteOffset": 0 + } + ], + "md5sum": "490c21a440f5e1714261de6a9549760c" + }, + { + "dataPath": "params_shard_66.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "model.layers.18.attention.wo.q_weight", + "shape": [ + 6144, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 18874368, + "byteOffset": 0 + } + ], + "md5sum": "db9a510efeca4751586b1ba77c862e90" + }, + { + "dataPath": "params_shard_67.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "model.layers.18.attention.wqkv.q_weight", + "shape": [ + 8192, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "7b040c1c18f4abc6b9a2e61411dd13b7" + }, + { + "dataPath": "params_shard_68.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.18.feed_forward.gate_up_proj.q_weight", + "shape": [ + 32768, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "38dccce8fae7230bdaf6908b657314df" + }, + { + "dataPath": "params_shard_69.bin", + "format": "raw-shard", + "nbytes": 24391680, + "records": [ + { + "name": "model.layers.17.feed_forward.gate_up_proj.q_scale", + "shape": [ + 32768, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.17.feed_forward.w2.q_scale", + "shape": [ + 6144, + 512 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 6291456, + "byteOffset": 12582912 + }, + { + "name": "model.layers.17.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 18874368 + }, + { + "name": "model.layers.18.attention.wo.q_scale", + "shape": [ + 6144, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 2359296, + "byteOffset": 18886656 + }, + { + "name": "model.layers.18.attention.wqkv.q_scale", + "shape": [ + 8192, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3145728, + "byteOffset": 21245952 + } + ], + "md5sum": "14a71172fc59a14a8f2f3c5e9b343fa3" + }, + { + "dataPath": "params_shard_70.bin", + "format": "raw-shard", + "nbytes": 50331648, + "records": [ + { + "name": "model.layers.18.feed_forward.w2.q_weight", + "shape": [ + 6144, + 2048 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 50331648, + "byteOffset": 0 + } + ], + "md5sum": "b09d8cac1fa6217954b45c6dd9bf8a5f" + }, + { + "dataPath": "params_shard_71.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "model.layers.19.attention.wo.q_weight", + "shape": [ + 6144, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 18874368, + "byteOffset": 0 + } + ], + "md5sum": "7d623a78548db9de6ecb0ba26caf9473" + }, + { + "dataPath": "params_shard_72.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "model.layers.19.attention.wqkv.q_weight", + "shape": [ + 8192, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "830dd81fda54b730aa38974808d42f8b" + }, + { + "dataPath": "params_shard_73.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.19.feed_forward.gate_up_proj.q_weight", + "shape": [ + 32768, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "ecdcdee88ef207c0edfff16c4963c792" + }, + { + "dataPath": "params_shard_74.bin", + "format": "raw-shard", + "nbytes": 24416256, + "records": [ + { + "name": "model.layers.18.feed_forward.gate_up_proj.q_scale", + "shape": [ + 32768, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.18.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 12582912 + }, + { + "name": "model.layers.18.feed_forward.w2.q_scale", + "shape": [ + 6144, + 512 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 6291456, + "byteOffset": 12595200 + }, + { + "name": "model.layers.18.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 18886656 + }, + { + "name": "model.layers.19.attention.wo.q_scale", + "shape": [ + 6144, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 2359296, + "byteOffset": 18898944 + }, + { + "name": "model.layers.19.attention.wqkv.q_scale", + "shape": [ + 8192, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3145728, + "byteOffset": 21258240 + }, + { + "name": "model.layers.19.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 24403968 + } + ], + "md5sum": "af9790c05f42784abfeda3221644f278" + }, + { + "dataPath": "params_shard_75.bin", + "format": "raw-shard", + "nbytes": 50331648, + "records": [ + { + "name": "model.layers.19.feed_forward.w2.q_weight", + "shape": [ + 6144, + 2048 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 50331648, + "byteOffset": 0 + } + ], + "md5sum": "353670f439163af331a12230bbb91c31" + }, + { + "dataPath": "params_shard_76.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "model.layers.20.attention.wo.q_weight", + "shape": [ + 6144, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 18874368, + "byteOffset": 0 + } + ], + "md5sum": "68d29e416891959e83934fd381c3d5d5" + }, + { + "dataPath": "params_shard_77.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "model.layers.20.attention.wqkv.q_weight", + "shape": [ + 8192, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "e68baff97678fedcd3690b52f3570b6f" + }, + { + "dataPath": "params_shard_78.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.20.feed_forward.gate_up_proj.q_weight", + "shape": [ + 32768, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "23b1527e1c6ca325159ad712bb0d9392" + }, + { + "dataPath": "params_shard_79.bin", + "format": "raw-shard", + "nbytes": 24403968, + "records": [ + { + "name": "model.layers.19.feed_forward.gate_up_proj.q_scale", + "shape": [ + 32768, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.19.feed_forward.w2.q_scale", + "shape": [ + 6144, + 512 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 6291456, + "byteOffset": 12582912 + }, + { + "name": "model.layers.19.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 18874368 + }, + { + "name": "model.layers.20.attention.wo.q_scale", + "shape": [ + 6144, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 2359296, + "byteOffset": 18886656 + }, + { + "name": "model.layers.20.attention.wqkv.q_scale", + "shape": [ + 8192, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3145728, + "byteOffset": 21245952 + }, + { + "name": "model.layers.20.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 24391680 + } + ], + "md5sum": "43e154db72c887328011b222eddc1d55" + }, + { + "dataPath": "params_shard_80.bin", + "format": "raw-shard", + "nbytes": 50331648, + "records": [ + { + "name": "model.layers.20.feed_forward.w2.q_weight", + "shape": [ + 6144, + 2048 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 50331648, + "byteOffset": 0 + } + ], + "md5sum": "13717ffad5b2cf7c094193bde6a283d5" + }, + { + "dataPath": "params_shard_81.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "model.layers.21.attention.wo.q_weight", + "shape": [ + 6144, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 18874368, + "byteOffset": 0 + } + ], + "md5sum": "37274533a84b02617807533fbd266104" + }, + { + "dataPath": "params_shard_82.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "model.layers.21.attention.wqkv.q_weight", + "shape": [ + 8192, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "c2f2273008df8d15839af1d97d24dc1d" + }, + { + "dataPath": "params_shard_83.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.21.feed_forward.gate_up_proj.q_weight", + "shape": [ + 32768, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "31b73de45831f78b149432353e767fd1" + }, + { + "dataPath": "params_shard_84.bin", + "format": "raw-shard", + "nbytes": 24403968, + "records": [ + { + "name": "model.layers.20.feed_forward.gate_up_proj.q_scale", + "shape": [ + 32768, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.20.feed_forward.w2.q_scale", + "shape": [ + 6144, + 512 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 6291456, + "byteOffset": 12582912 + }, + { + "name": "model.layers.20.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 18874368 + }, + { + "name": "model.layers.21.attention.wo.q_scale", + "shape": [ + 6144, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 2359296, + "byteOffset": 18886656 + }, + { + "name": "model.layers.21.attention.wqkv.q_scale", + "shape": [ + 8192, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3145728, + "byteOffset": 21245952 + }, + { + "name": "model.layers.21.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 24391680 + } + ], + "md5sum": "3de2c2a06fc1c7ffe7167fe61d34680a" + }, + { + "dataPath": "params_shard_85.bin", + "format": "raw-shard", + "nbytes": 50331648, + "records": [ + { + "name": "model.layers.21.feed_forward.w2.q_weight", + "shape": [ + 6144, + 2048 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 50331648, + "byteOffset": 0 + } + ], + "md5sum": "86af285350ed289af29807476b3f9b97" + }, + { + "dataPath": "params_shard_86.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "model.layers.22.attention.wo.q_weight", + "shape": [ + 6144, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 18874368, + "byteOffset": 0 + } + ], + "md5sum": "89aecee669e406a982e7ea38e48d5e5b" + }, + { + "dataPath": "params_shard_87.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "model.layers.22.attention.wqkv.q_weight", + "shape": [ + 8192, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "c7d7401860f343773355a3c115f23f8b" + }, + { + "dataPath": "params_shard_88.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.22.feed_forward.gate_up_proj.q_weight", + "shape": [ + 32768, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "f7f068722b55e80671ec8d759209c9ac" + }, + { + "dataPath": "params_shard_89.bin", + "format": "raw-shard", + "nbytes": 24403968, + "records": [ + { + "name": "model.layers.21.feed_forward.gate_up_proj.q_scale", + "shape": [ + 32768, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.21.feed_forward.w2.q_scale", + "shape": [ + 6144, + 512 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 6291456, + "byteOffset": 12582912 + }, + { + "name": "model.layers.21.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 18874368 + }, + { + "name": "model.layers.22.attention.wo.q_scale", + "shape": [ + 6144, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 2359296, + "byteOffset": 18886656 + }, + { + "name": "model.layers.22.attention.wqkv.q_scale", + "shape": [ + 8192, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3145728, + "byteOffset": 21245952 + }, + { + "name": "model.layers.22.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 24391680 + } + ], + "md5sum": "00d5d456e1cab93959fa3cd1714fe941" + }, + { + "dataPath": "params_shard_90.bin", + "format": "raw-shard", + "nbytes": 50331648, + "records": [ + { + "name": "model.layers.22.feed_forward.w2.q_weight", + "shape": [ + 6144, + 2048 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 50331648, + "byteOffset": 0 + } + ], + "md5sum": "5ebe811f4c8b0122fcdc1060af17df4f" + }, + { + "dataPath": "params_shard_91.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "model.layers.23.attention.wo.q_weight", + "shape": [ + 6144, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 18874368, + "byteOffset": 0 + } + ], + "md5sum": "8471703fa9b94b2c3fcf5eba6455dd60" + }, + { + "dataPath": "params_shard_92.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "model.layers.23.attention.wqkv.q_weight", + "shape": [ + 8192, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "76f0d2a2efcae8fa029a95f8ee24a246" + }, + { + "dataPath": "params_shard_93.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.23.feed_forward.gate_up_proj.q_weight", + "shape": [ + 32768, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "4a6b1934376dc0218dbac30ed21a9d5f" + }, + { + "dataPath": "params_shard_94.bin", + "format": "raw-shard", + "nbytes": 24391680, + "records": [ + { + "name": "model.layers.22.feed_forward.gate_up_proj.q_scale", + "shape": [ + 32768, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.22.feed_forward.w2.q_scale", + "shape": [ + 6144, + 512 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 6291456, + "byteOffset": 12582912 + }, + { + "name": "model.layers.22.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 18874368 + }, + { + "name": "model.layers.23.attention.wo.q_scale", + "shape": [ + 6144, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 2359296, + "byteOffset": 18886656 + }, + { + "name": "model.layers.23.attention.wqkv.q_scale", + "shape": [ + 8192, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3145728, + "byteOffset": 21245952 + } + ], + "md5sum": "f44fe42d3a651dd8833e7bf0e00bf3a9" + }, + { + "dataPath": "params_shard_95.bin", + "format": "raw-shard", + "nbytes": 50331648, + "records": [ + { + "name": "model.layers.23.feed_forward.w2.q_weight", + "shape": [ + 6144, + 2048 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 50331648, + "byteOffset": 0 + } + ], + "md5sum": "ac1dc6aaca1c4d25bbd6a4af1511ff10" + }, + { + "dataPath": "params_shard_96.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "model.layers.24.attention.wo.q_weight", + "shape": [ + 6144, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 18874368, + "byteOffset": 0 + } + ], + "md5sum": "ba7c52d984110124ed7f4baa601ad9ab" + }, + { + "dataPath": "params_shard_97.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "model.layers.24.attention.wqkv.q_weight", + "shape": [ + 8192, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "fbb39581ba624860e4669edfba7247e1" + }, + { + "dataPath": "params_shard_98.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.24.feed_forward.gate_up_proj.q_weight", + "shape": [ + 32768, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "0399dc767317b8c3adc8f4ae04f2e113" + }, + { + "dataPath": "params_shard_99.bin", + "format": "raw-shard", + "nbytes": 24416256, + "records": [ + { + "name": "model.layers.23.feed_forward.gate_up_proj.q_scale", + "shape": [ + 32768, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.23.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 12582912 + }, + { + "name": "model.layers.23.feed_forward.w2.q_scale", + "shape": [ + 6144, + 512 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 6291456, + "byteOffset": 12595200 + }, + { + "name": "model.layers.23.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 18886656 + }, + { + "name": "model.layers.24.attention.wo.q_scale", + "shape": [ + 6144, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 2359296, + "byteOffset": 18898944 + }, + { + "name": "model.layers.24.attention.wqkv.q_scale", + "shape": [ + 8192, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3145728, + "byteOffset": 21258240 + }, + { + "name": "model.layers.24.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 24403968 + } + ], + "md5sum": "b5e0a5bc5eaaf33e740699713867945f" + }, + { + "dataPath": "params_shard_100.bin", + "format": "raw-shard", + "nbytes": 50331648, + "records": [ + { + "name": "model.layers.24.feed_forward.w2.q_weight", + "shape": [ + 6144, + 2048 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 50331648, + "byteOffset": 0 + } + ], + "md5sum": "abecd49f7941e61eea6b8c100cbcdc14" + }, + { + "dataPath": "params_shard_101.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "model.layers.25.attention.wo.q_weight", + "shape": [ + 6144, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 18874368, + "byteOffset": 0 + } + ], + "md5sum": "64399e2619d7a68fd741391cc395cf20" + }, + { + "dataPath": "params_shard_102.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "model.layers.25.attention.wqkv.q_weight", + "shape": [ + 8192, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "5321c22526b257abae7ace77691f8f25" + }, + { + "dataPath": "params_shard_103.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.25.feed_forward.gate_up_proj.q_weight", + "shape": [ + 32768, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "fa386f927b426e09c683e2c0d7a6af69" + }, + { + "dataPath": "params_shard_104.bin", + "format": "raw-shard", + "nbytes": 24403968, + "records": [ + { + "name": "model.layers.24.feed_forward.gate_up_proj.q_scale", + "shape": [ + 32768, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.24.feed_forward.w2.q_scale", + "shape": [ + 6144, + 512 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 6291456, + "byteOffset": 12582912 + }, + { + "name": "model.layers.24.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 18874368 + }, + { + "name": "model.layers.25.attention.wo.q_scale", + "shape": [ + 6144, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 2359296, + "byteOffset": 18886656 + }, + { + "name": "model.layers.25.attention.wqkv.q_scale", + "shape": [ + 8192, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3145728, + "byteOffset": 21245952 + }, + { + "name": "model.layers.25.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 24391680 + } + ], + "md5sum": "e99c9703a632dfafc70450a02c4ecd9d" + }, + { + "dataPath": "params_shard_105.bin", + "format": "raw-shard", + "nbytes": 50331648, + "records": [ + { + "name": "model.layers.25.feed_forward.w2.q_weight", + "shape": [ + 6144, + 2048 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 50331648, + "byteOffset": 0 + } + ], + "md5sum": "f0a979ea49807bbe454f4a697e6a6af0" + }, + { + "dataPath": "params_shard_106.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "model.layers.26.attention.wo.q_weight", + "shape": [ + 6144, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 18874368, + "byteOffset": 0 + } + ], + "md5sum": "a0f3fe8acc8c07a35822ed17144eccd7" + }, + { + "dataPath": "params_shard_107.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "model.layers.26.attention.wqkv.q_weight", + "shape": [ + 8192, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "22b9e6d91cb37f08c0f50dc0b336a60a" + }, + { + "dataPath": "params_shard_108.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.26.feed_forward.gate_up_proj.q_weight", + "shape": [ + 32768, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "f40f12f4b4550c84248a2efc1b7bbb36" + }, + { + "dataPath": "params_shard_109.bin", + "format": "raw-shard", + "nbytes": 24403968, + "records": [ + { + "name": "model.layers.25.feed_forward.gate_up_proj.q_scale", + "shape": [ + 32768, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.25.feed_forward.w2.q_scale", + "shape": [ + 6144, + 512 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 6291456, + "byteOffset": 12582912 + }, + { + "name": "model.layers.25.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 18874368 + }, + { + "name": "model.layers.26.attention.wo.q_scale", + "shape": [ + 6144, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 2359296, + "byteOffset": 18886656 + }, + { + "name": "model.layers.26.attention.wqkv.q_scale", + "shape": [ + 8192, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3145728, + "byteOffset": 21245952 + }, + { + "name": "model.layers.26.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 24391680 + } + ], + "md5sum": "e635be28861255c987c0b2f55e4811ab" + }, + { + "dataPath": "params_shard_110.bin", + "format": "raw-shard", + "nbytes": 50331648, + "records": [ + { + "name": "model.layers.26.feed_forward.w2.q_weight", + "shape": [ + 6144, + 2048 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 50331648, + "byteOffset": 0 + } + ], + "md5sum": "4de9a0fa239fabd4ea050e6ad13eebdd" + }, + { + "dataPath": "params_shard_111.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "model.layers.27.attention.wo.q_weight", + "shape": [ + 6144, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 18874368, + "byteOffset": 0 + } + ], + "md5sum": "05170ab9db2c8aad45f180ea988722e9" + }, + { + "dataPath": "params_shard_112.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "model.layers.27.attention.wqkv.q_weight", + "shape": [ + 8192, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "d46ebfefe27eb12184a000ec9c408610" + }, + { + "dataPath": "params_shard_113.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.27.feed_forward.gate_up_proj.q_weight", + "shape": [ + 32768, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "b42151e035e34fd5211c53d960d6b8b2" + }, + { + "dataPath": "params_shard_114.bin", + "format": "raw-shard", + "nbytes": 24403968, + "records": [ + { + "name": "model.layers.26.feed_forward.gate_up_proj.q_scale", + "shape": [ + 32768, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.26.feed_forward.w2.q_scale", + "shape": [ + 6144, + 512 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 6291456, + "byteOffset": 12582912 + }, + { + "name": "model.layers.26.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 18874368 + }, + { + "name": "model.layers.27.attention.wo.q_scale", + "shape": [ + 6144, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 2359296, + "byteOffset": 18886656 + }, + { + "name": "model.layers.27.attention.wqkv.q_scale", + "shape": [ + 8192, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3145728, + "byteOffset": 21245952 + }, + { + "name": "model.layers.27.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 24391680 + } + ], + "md5sum": "2dca9dd7364013a355cc0cc816eb51ab" + }, + { + "dataPath": "params_shard_115.bin", + "format": "raw-shard", + "nbytes": 50331648, + "records": [ + { + "name": "model.layers.27.feed_forward.w2.q_weight", + "shape": [ + 6144, + 2048 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 50331648, + "byteOffset": 0 + } + ], + "md5sum": "0a2c75767433aea6df65cbc53bec2167" + }, + { + "dataPath": "params_shard_116.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "model.layers.28.attention.wo.q_weight", + "shape": [ + 6144, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 18874368, + "byteOffset": 0 + } + ], + "md5sum": "2b59db67da1499944f0ab0a729bd7154" + }, + { + "dataPath": "params_shard_117.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "model.layers.28.attention.wqkv.q_weight", + "shape": [ + 8192, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "f28b8d9086d55030b4308cf42bac76ae" + }, + { + "dataPath": "params_shard_118.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.28.feed_forward.gate_up_proj.q_weight", + "shape": [ + 32768, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "345efd5241119907c753fbb3db159cf9" + }, + { + "dataPath": "params_shard_119.bin", + "format": "raw-shard", + "nbytes": 24391680, + "records": [ + { + "name": "model.layers.27.feed_forward.gate_up_proj.q_scale", + "shape": [ + 32768, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.27.feed_forward.w2.q_scale", + "shape": [ + 6144, + 512 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 6291456, + "byteOffset": 12582912 + }, + { + "name": "model.layers.27.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 18874368 + }, + { + "name": "model.layers.28.attention.wo.q_scale", + "shape": [ + 6144, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 2359296, + "byteOffset": 18886656 + }, + { + "name": "model.layers.28.attention.wqkv.q_scale", + "shape": [ + 8192, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3145728, + "byteOffset": 21245952 + } + ], + "md5sum": "51f608415b50d03292e428f7346f8858" + }, + { + "dataPath": "params_shard_120.bin", + "format": "raw-shard", + "nbytes": 50331648, + "records": [ + { + "name": "model.layers.28.feed_forward.w2.q_weight", + "shape": [ + 6144, + 2048 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 50331648, + "byteOffset": 0 + } + ], + "md5sum": "4d589f4ebf7397dea54d54df9c60f02f" + }, + { + "dataPath": "params_shard_121.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "model.layers.29.attention.wo.q_weight", + "shape": [ + 6144, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 18874368, + "byteOffset": 0 + } + ], + "md5sum": "2e9327a41378044126474c294689a3fc" + }, + { + "dataPath": "params_shard_122.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "model.layers.29.attention.wqkv.q_weight", + "shape": [ + 8192, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "593cc919dbc8eb0d75eaa59b0b3ef6ec" + }, + { + "dataPath": "params_shard_123.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.29.feed_forward.gate_up_proj.q_weight", + "shape": [ + 32768, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "9bad7a0e49fb4f8fa4147214514b4883" + }, + { + "dataPath": "params_shard_124.bin", + "format": "raw-shard", + "nbytes": 24416256, + "records": [ + { + "name": "model.layers.28.feed_forward.gate_up_proj.q_scale", + "shape": [ + 32768, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.28.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 12582912 + }, + { + "name": "model.layers.28.feed_forward.w2.q_scale", + "shape": [ + 6144, + 512 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 6291456, + "byteOffset": 12595200 + }, + { + "name": "model.layers.28.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 18886656 + }, + { + "name": "model.layers.29.attention.wo.q_scale", + "shape": [ + 6144, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 2359296, + "byteOffset": 18898944 + }, + { + "name": "model.layers.29.attention.wqkv.q_scale", + "shape": [ + 8192, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3145728, + "byteOffset": 21258240 + }, + { + "name": "model.layers.29.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 24403968 + } + ], + "md5sum": "576d510787bfb1e7b012a0c52da43c4e" + }, + { + "dataPath": "params_shard_125.bin", + "format": "raw-shard", + "nbytes": 50331648, + "records": [ + { + "name": "model.layers.29.feed_forward.w2.q_weight", + "shape": [ + 6144, + 2048 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 50331648, + "byteOffset": 0 + } + ], + "md5sum": "b6352dda9da320bd8a71fd182f2fcf92" + }, + { + "dataPath": "params_shard_126.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "model.layers.30.attention.wo.q_weight", + "shape": [ + 6144, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 18874368, + "byteOffset": 0 + } + ], + "md5sum": "8e83e004ea05000f072f5086400a0682" + }, + { + "dataPath": "params_shard_127.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "model.layers.30.attention.wqkv.q_weight", + "shape": [ + 8192, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "9e2954aadd935b9e64748a49abf7202d" + }, + { + "dataPath": "params_shard_128.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.30.feed_forward.gate_up_proj.q_weight", + "shape": [ + 32768, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "2413d9696a13000692c530d69ceb5f98" + }, + { + "dataPath": "params_shard_129.bin", + "format": "raw-shard", + "nbytes": 24403968, + "records": [ + { + "name": "model.layers.29.feed_forward.gate_up_proj.q_scale", + "shape": [ + 32768, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.29.feed_forward.w2.q_scale", + "shape": [ + 6144, + 512 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 6291456, + "byteOffset": 12582912 + }, + { + "name": "model.layers.29.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 18874368 + }, + { + "name": "model.layers.30.attention.wo.q_scale", + "shape": [ + 6144, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 2359296, + "byteOffset": 18886656 + }, + { + "name": "model.layers.30.attention.wqkv.q_scale", + "shape": [ + 8192, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3145728, + "byteOffset": 21245952 + }, + { + "name": "model.layers.30.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 24391680 + } + ], + "md5sum": "6c4381ff3020c4b4bcdd27c3aa20882c" + }, + { + "dataPath": "params_shard_130.bin", + "format": "raw-shard", + "nbytes": 50331648, + "records": [ + { + "name": "model.layers.30.feed_forward.w2.q_weight", + "shape": [ + 6144, + 2048 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 50331648, + "byteOffset": 0 + } + ], + "md5sum": "42f17b9c6aea608c2132b8a5414977e5" + }, + { + "dataPath": "params_shard_131.bin", + "format": "raw-shard", + "nbytes": 50331648, + "records": [ + { + "name": "model.layers.3.feed_forward.w2.q_weight", + "shape": [ + 6144, + 2048 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 50331648, + "byteOffset": 0 + } + ], + "md5sum": "dcdbdffde2d4812ce4c25c4ab293fff3" + }, + { + "dataPath": "params_shard_132.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "model.layers.4.attention.wo.q_weight", + "shape": [ + 6144, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 18874368, + "byteOffset": 0 + } + ], + "md5sum": "0d441147c8c220d184bc7a29a7c878c3" + }, + { + "dataPath": "params_shard_133.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "model.layers.4.attention.wqkv.q_weight", + "shape": [ + 8192, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "d614ff9d28eab46ca9e2c7019486ef92" + }, + { + "dataPath": "params_shard_134.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.4.feed_forward.gate_up_proj.q_weight", + "shape": [ + 32768, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "bdd6f89340e69f6715dcaedf8aa83781" + }, + { + "dataPath": "params_shard_135.bin", + "format": "raw-shard", + "nbytes": 30720000, + "records": [ + { + "name": "model.layers.30.feed_forward.gate_up_proj.q_scale", + "shape": [ + 32768, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.30.feed_forward.w2.q_scale", + "shape": [ + 6144, + 512 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 6291456, + "byteOffset": 12582912 + }, + { + "name": "model.layers.30.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 18874368 + }, + { + "name": "model.layers.3.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 18886656 + }, + { + "name": "model.layers.3.feed_forward.w2.q_scale", + "shape": [ + 6144, + 512 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 6291456, + "byteOffset": 18898944 + }, + { + "name": "model.layers.3.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 25190400 + }, + { + "name": "model.layers.4.attention.wo.q_scale", + "shape": [ + 6144, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 2359296, + "byteOffset": 25202688 + }, + { + "name": "model.layers.4.attention.wqkv.q_scale", + "shape": [ + 8192, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3145728, + "byteOffset": 27561984 + }, + { + "name": "model.layers.4.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 30707712 + } + ], + "md5sum": "c8de6ad9681b6e394bc8819849b03756" + }, + { + "dataPath": "params_shard_136.bin", + "format": "raw-shard", + "nbytes": 50331648, + "records": [ + { + "name": "model.layers.4.feed_forward.w2.q_weight", + "shape": [ + 6144, + 2048 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 50331648, + "byteOffset": 0 + } + ], + "md5sum": "7cad850ad5042fc7f5a9fc8cb0874308" + }, + { + "dataPath": "params_shard_137.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "model.layers.5.attention.wo.q_weight", + "shape": [ + 6144, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 18874368, + "byteOffset": 0 + } + ], + "md5sum": "915fc8f2006351af222d37a9044dde10" + }, + { + "dataPath": "params_shard_138.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "model.layers.5.attention.wqkv.q_weight", + "shape": [ + 8192, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "972f85a3f93ae5f84bff1da4fa5e0030" + }, + { + "dataPath": "params_shard_139.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.5.feed_forward.gate_up_proj.q_weight", + "shape": [ + 32768, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "b73ac7ae2b42939e5eea0eed24c0959e" + }, + { + "dataPath": "params_shard_140.bin", + "format": "raw-shard", + "nbytes": 24403968, + "records": [ + { + "name": "model.layers.4.feed_forward.gate_up_proj.q_scale", + "shape": [ + 32768, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.4.feed_forward.w2.q_scale", + "shape": [ + 6144, + 512 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 6291456, + "byteOffset": 12582912 + }, + { + "name": "model.layers.4.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 18874368 + }, + { + "name": "model.layers.5.attention.wo.q_scale", + "shape": [ + 6144, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 2359296, + "byteOffset": 18886656 + }, + { + "name": "model.layers.5.attention.wqkv.q_scale", + "shape": [ + 8192, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3145728, + "byteOffset": 21245952 + }, + { + "name": "model.layers.5.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 24391680 + } + ], + "md5sum": "8a319ed0157880eb0e20298ae24a9137" + }, + { + "dataPath": "params_shard_141.bin", + "format": "raw-shard", + "nbytes": 50331648, + "records": [ + { + "name": "model.layers.5.feed_forward.w2.q_weight", + "shape": [ + 6144, + 2048 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 50331648, + "byteOffset": 0 + } + ], + "md5sum": "0c4b8414a4671aaea6b15db3740089c0" + }, + { + "dataPath": "params_shard_142.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "model.layers.31.attention.wo.q_weight", + "shape": [ + 6144, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 18874368, + "byteOffset": 0 + } + ], + "md5sum": "e7001ce4fc17f9de8ec82fae94ff06aa" + }, + { + "dataPath": "params_shard_143.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "model.layers.31.attention.wqkv.q_weight", + "shape": [ + 8192, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "7a25b3067ac0d4e6d240b588ccf4d37d" + }, + { + "dataPath": "params_shard_144.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.31.feed_forward.gate_up_proj.q_weight", + "shape": [ + 32768, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "9da3d0628fb4d6bbd4ef79079a329765" + }, + { + "dataPath": "params_shard_145.bin", + "format": "raw-shard", + "nbytes": 24403968, + "records": [ + { + "name": "model.layers.5.feed_forward.gate_up_proj.q_scale", + "shape": [ + 32768, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.5.feed_forward.w2.q_scale", + "shape": [ + 6144, + 512 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 6291456, + "byteOffset": 12582912 + }, + { + "name": "model.layers.5.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 18874368 + }, + { + "name": "model.layers.31.attention.wo.q_scale", + "shape": [ + 6144, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 2359296, + "byteOffset": 18886656 + }, + { + "name": "model.layers.31.attention.wqkv.q_scale", + "shape": [ + 8192, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3145728, + "byteOffset": 21245952 + }, + { + "name": "model.layers.31.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 24391680 + } + ], + "md5sum": "055a8997ca2eee22cd74d1b45f01bead" + }, + { + "dataPath": "params_shard_146.bin", + "format": "raw-shard", + "nbytes": 50331648, + "records": [ + { + "name": "model.layers.31.feed_forward.w2.q_weight", + "shape": [ + 6144, + 2048 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 50331648, + "byteOffset": 0 + } + ], + "md5sum": "24a5a4dbc97c24e14f5813d2d3203bda" + }, + { + "dataPath": "params_shard_147.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "model.layers.32.attention.wo.q_weight", + "shape": [ + 6144, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 18874368, + "byteOffset": 0 + } + ], + "md5sum": "78cf1b841c2d8bca6eed41273d6842e2" + }, + { + "dataPath": "params_shard_148.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "model.layers.32.attention.wqkv.q_weight", + "shape": [ + 8192, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "6b4a25b89401c71edd3e3e9fd1cf8b8f" + }, + { + "dataPath": "params_shard_149.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.32.feed_forward.gate_up_proj.q_weight", + "shape": [ + 32768, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "95ef384812d5bcb40783faea1485d38c" + }, + { + "dataPath": "params_shard_150.bin", + "format": "raw-shard", + "nbytes": 24403968, + "records": [ + { + "name": "model.layers.31.feed_forward.gate_up_proj.q_scale", + "shape": [ + 32768, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.31.feed_forward.w2.q_scale", + "shape": [ + 6144, + 512 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 6291456, + "byteOffset": 12582912 + }, + { + "name": "model.layers.31.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 18874368 + }, + { + "name": "model.layers.32.attention.wo.q_scale", + "shape": [ + 6144, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 2359296, + "byteOffset": 18886656 + }, + { + "name": "model.layers.32.attention.wqkv.q_scale", + "shape": [ + 8192, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3145728, + "byteOffset": 21245952 + }, + { + "name": "model.layers.32.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 24391680 + } + ], + "md5sum": "68289130bb93e6f4eac3bdf3d284b401" + }, + { + "dataPath": "params_shard_151.bin", + "format": "raw-shard", + "nbytes": 50331648, + "records": [ + { + "name": "model.layers.32.feed_forward.w2.q_weight", + "shape": [ + 6144, + 2048 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 50331648, + "byteOffset": 0 + } + ], + "md5sum": "a2d72dbf335134fa3c889848a0264f43" + }, + { + "dataPath": "params_shard_152.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "model.layers.33.attention.wo.q_weight", + "shape": [ + 6144, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 18874368, + "byteOffset": 0 + } + ], + "md5sum": "d82c9855b12685d6de514a7923332cf2" + }, + { + "dataPath": "params_shard_153.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "model.layers.33.attention.wqkv.q_weight", + "shape": [ + 8192, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "5834dae9f685eeb46df9ce91a4ae6f49" + }, + { + "dataPath": "params_shard_154.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.33.feed_forward.gate_up_proj.q_weight", + "shape": [ + 32768, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "281aec78040f897d50bba3dc23421143" + }, + { + "dataPath": "params_shard_155.bin", + "format": "raw-shard", + "nbytes": 24391680, + "records": [ + { + "name": "model.layers.32.feed_forward.gate_up_proj.q_scale", + "shape": [ + 32768, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.32.feed_forward.w2.q_scale", + "shape": [ + 6144, + 512 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 6291456, + "byteOffset": 12582912 + }, + { + "name": "model.layers.32.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 18874368 + }, + { + "name": "model.layers.33.attention.wo.q_scale", + "shape": [ + 6144, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 2359296, + "byteOffset": 18886656 + }, + { + "name": "model.layers.33.attention.wqkv.q_scale", + "shape": [ + 8192, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3145728, + "byteOffset": 21245952 + } + ], + "md5sum": "d11703fb84b835d9e1ee31e75753908b" + }, + { + "dataPath": "params_shard_156.bin", + "format": "raw-shard", + "nbytes": 50331648, + "records": [ + { + "name": "model.layers.33.feed_forward.w2.q_weight", + "shape": [ + 6144, + 2048 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 50331648, + "byteOffset": 0 + } + ], + "md5sum": "d48c63086b925cf7880dbb60170aed98" + }, + { + "dataPath": "params_shard_157.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "model.layers.34.attention.wo.q_weight", + "shape": [ + 6144, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 18874368, + "byteOffset": 0 + } + ], + "md5sum": "0570540df18fc7cfcfe6417c2b976400" + }, + { + "dataPath": "params_shard_158.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "model.layers.34.attention.wqkv.q_weight", + "shape": [ + 8192, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "8db337e43f10305f1dc9ca9f12999301" + }, + { + "dataPath": "params_shard_159.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.34.feed_forward.gate_up_proj.q_weight", + "shape": [ + 32768, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "adec4a6bd21f3574bbd467bddae41451" + }, + { + "dataPath": "params_shard_160.bin", + "format": "raw-shard", + "nbytes": 24416256, + "records": [ + { + "name": "model.layers.33.feed_forward.gate_up_proj.q_scale", + "shape": [ + 32768, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.33.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 12582912 + }, + { + "name": "model.layers.33.feed_forward.w2.q_scale", + "shape": [ + 6144, + 512 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 6291456, + "byteOffset": 12595200 + }, + { + "name": "model.layers.33.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 18886656 + }, + { + "name": "model.layers.34.attention.wo.q_scale", + "shape": [ + 6144, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 2359296, + "byteOffset": 18898944 + }, + { + "name": "model.layers.34.attention.wqkv.q_scale", + "shape": [ + 8192, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3145728, + "byteOffset": 21258240 + }, + { + "name": "model.layers.34.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 24403968 + } + ], + "md5sum": "63bf25fe91c0791e55de7b2e8b19a4cc" + }, + { + "dataPath": "params_shard_161.bin", + "format": "raw-shard", + "nbytes": 50331648, + "records": [ + { + "name": "model.layers.34.feed_forward.w2.q_weight", + "shape": [ + 6144, + 2048 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 50331648, + "byteOffset": 0 + } + ], + "md5sum": "77f3f7ffb311e4b9a9ca02cffd053ec6" + }, + { + "dataPath": "params_shard_162.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "model.layers.35.attention.wo.q_weight", + "shape": [ + 6144, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 18874368, + "byteOffset": 0 + } + ], + "md5sum": "93d218d704627aa09e6795f93d91250f" + }, + { + "dataPath": "params_shard_163.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "model.layers.35.attention.wqkv.q_weight", + "shape": [ + 8192, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "dc41359b12ab75c08ab15da606f1813d" + }, + { + "dataPath": "params_shard_164.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.35.feed_forward.gate_up_proj.q_weight", + "shape": [ + 32768, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "9e5e83ff86b12484dd4e71651e9c2a2e" + }, + { + "dataPath": "params_shard_165.bin", + "format": "raw-shard", + "nbytes": 24403968, + "records": [ + { + "name": "model.layers.34.feed_forward.gate_up_proj.q_scale", + "shape": [ + 32768, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.34.feed_forward.w2.q_scale", + "shape": [ + 6144, + 512 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 6291456, + "byteOffset": 12582912 + }, + { + "name": "model.layers.34.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 18874368 + }, + { + "name": "model.layers.35.attention.wo.q_scale", + "shape": [ + 6144, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 2359296, + "byteOffset": 18886656 + }, + { + "name": "model.layers.35.attention.wqkv.q_scale", + "shape": [ + 8192, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3145728, + "byteOffset": 21245952 + }, + { + "name": "model.layers.35.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 24391680 + } + ], + "md5sum": "06aebcfd006c39b66d096ec2ad7bd0db" + }, + { + "dataPath": "params_shard_166.bin", + "format": "raw-shard", + "nbytes": 50331648, + "records": [ + { + "name": "model.layers.35.feed_forward.w2.q_weight", + "shape": [ + 6144, + 2048 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 50331648, + "byteOffset": 0 + } + ], + "md5sum": "96da9a8c9573fd0ce9e5fa3319b3ce79" + }, + { + "dataPath": "params_shard_167.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "model.layers.36.attention.wo.q_weight", + "shape": [ + 6144, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 18874368, + "byteOffset": 0 + } + ], + "md5sum": "18e21374c9266abf6a1893f6b19824e1" + }, + { + "dataPath": "params_shard_168.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "model.layers.36.attention.wqkv.q_weight", + "shape": [ + 8192, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "4f732c8876e920461a3ac01bf1db04c4" + }, + { + "dataPath": "params_shard_169.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.36.feed_forward.gate_up_proj.q_weight", + "shape": [ + 32768, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "b6447ad2d5fb20fdbd4f2892b8a03f54" + }, + { + "dataPath": "params_shard_170.bin", + "format": "raw-shard", + "nbytes": 24403968, + "records": [ + { + "name": "model.layers.35.feed_forward.gate_up_proj.q_scale", + "shape": [ + 32768, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.35.feed_forward.w2.q_scale", + "shape": [ + 6144, + 512 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 6291456, + "byteOffset": 12582912 + }, + { + "name": "model.layers.35.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 18874368 + }, + { + "name": "model.layers.36.attention.wo.q_scale", + "shape": [ + 6144, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 2359296, + "byteOffset": 18886656 + }, + { + "name": "model.layers.36.attention.wqkv.q_scale", + "shape": [ + 8192, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3145728, + "byteOffset": 21245952 + }, + { + "name": "model.layers.36.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 24391680 + } + ], + "md5sum": "c06d8df77c349eb5f0e9bfa3248c6e3e" + }, + { + "dataPath": "params_shard_171.bin", + "format": "raw-shard", + "nbytes": 50331648, + "records": [ + { + "name": "model.layers.36.feed_forward.w2.q_weight", + "shape": [ + 6144, + 2048 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 50331648, + "byteOffset": 0 + } + ], + "md5sum": "dede3e093af0ac37893fa06367aaf846" + }, + { + "dataPath": "params_shard_172.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "model.layers.37.attention.wo.q_weight", + "shape": [ + 6144, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 18874368, + "byteOffset": 0 + } + ], + "md5sum": "9ac03336871aa4003a8c40b5ad0429e9" + }, + { + "dataPath": "params_shard_173.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "model.layers.37.attention.wqkv.q_weight", + "shape": [ + 8192, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "3e4004827b55b177a7ba54d3592bc1b0" + }, + { + "dataPath": "params_shard_174.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.37.feed_forward.gate_up_proj.q_weight", + "shape": [ + 32768, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "2481e0b4d019163e0edfe2ae03393001" + }, + { + "dataPath": "params_shard_175.bin", + "format": "raw-shard", + "nbytes": 24403968, + "records": [ + { + "name": "model.layers.36.feed_forward.gate_up_proj.q_scale", + "shape": [ + 32768, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.36.feed_forward.w2.q_scale", + "shape": [ + 6144, + 512 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 6291456, + "byteOffset": 12582912 + }, + { + "name": "model.layers.36.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 18874368 + }, + { + "name": "model.layers.37.attention.wo.q_scale", + "shape": [ + 6144, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 2359296, + "byteOffset": 18886656 + }, + { + "name": "model.layers.37.attention.wqkv.q_scale", + "shape": [ + 8192, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3145728, + "byteOffset": 21245952 + }, + { + "name": "model.layers.37.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 24391680 + } + ], + "md5sum": "0474791c9ced2b4366cdd93234349050" + }, + { + "dataPath": "params_shard_176.bin", + "format": "raw-shard", + "nbytes": 50331648, + "records": [ + { + "name": "model.layers.37.feed_forward.w2.q_weight", + "shape": [ + 6144, + 2048 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 50331648, + "byteOffset": 0 + } + ], + "md5sum": "645222585421be65fa6708fc85743a42" + }, + { + "dataPath": "params_shard_177.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "model.layers.38.attention.wo.q_weight", + "shape": [ + 6144, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 18874368, + "byteOffset": 0 + } + ], + "md5sum": "79061c56e9d8f780488219cfb82d3d1f" + }, + { + "dataPath": "params_shard_178.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "model.layers.38.attention.wqkv.q_weight", + "shape": [ + 8192, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "46bda62cb8057c1f52ae35424526dc1b" + }, + { + "dataPath": "params_shard_179.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.38.feed_forward.gate_up_proj.q_weight", + "shape": [ + 32768, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "9662209a638db26ba256c909b99a34ad" + }, + { + "dataPath": "params_shard_180.bin", + "format": "raw-shard", + "nbytes": 24391680, + "records": [ + { + "name": "model.layers.37.feed_forward.gate_up_proj.q_scale", + "shape": [ + 32768, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.37.feed_forward.w2.q_scale", + "shape": [ + 6144, + 512 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 6291456, + "byteOffset": 12582912 + }, + { + "name": "model.layers.37.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 18874368 + }, + { + "name": "model.layers.38.attention.wo.q_scale", + "shape": [ + 6144, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 2359296, + "byteOffset": 18886656 + }, + { + "name": "model.layers.38.attention.wqkv.q_scale", + "shape": [ + 8192, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3145728, + "byteOffset": 21245952 + } + ], + "md5sum": "48354f641c85a8d5988634844e168b85" + }, + { + "dataPath": "params_shard_181.bin", + "format": "raw-shard", + "nbytes": 50331648, + "records": [ + { + "name": "model.layers.38.feed_forward.w2.q_weight", + "shape": [ + 6144, + 2048 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 50331648, + "byteOffset": 0 + } + ], + "md5sum": "00b0cb59d8217ae84612648a467ac555" + }, + { + "dataPath": "params_shard_182.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "model.layers.39.attention.wo.q_weight", + "shape": [ + 6144, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 18874368, + "byteOffset": 0 + } + ], + "md5sum": "e5cbe25654de4a7b204a3bb524335f9d" + }, + { + "dataPath": "params_shard_183.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "model.layers.39.attention.wqkv.q_weight", + "shape": [ + 8192, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "5478c9f09b9766d3b423114742828a6e" + }, + { + "dataPath": "params_shard_184.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.39.feed_forward.gate_up_proj.q_weight", + "shape": [ + 32768, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "dd2f6f845ee3825755f8e566cc8d2c3d" + }, + { + "dataPath": "params_shard_185.bin", + "format": "raw-shard", + "nbytes": 24416256, + "records": [ + { + "name": "model.layers.38.feed_forward.gate_up_proj.q_scale", + "shape": [ + 32768, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.38.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 12582912 + }, + { + "name": "model.layers.38.feed_forward.w2.q_scale", + "shape": [ + 6144, + 512 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 6291456, + "byteOffset": 12595200 + }, + { + "name": "model.layers.38.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 18886656 + }, + { + "name": "model.layers.39.attention.wo.q_scale", + "shape": [ + 6144, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 2359296, + "byteOffset": 18898944 + }, + { + "name": "model.layers.39.attention.wqkv.q_scale", + "shape": [ + 8192, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3145728, + "byteOffset": 21258240 + }, + { + "name": "model.layers.39.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 24403968 + } + ], + "md5sum": "84d4b73a97b64848a6474d89516de110" + }, + { + "dataPath": "params_shard_186.bin", + "format": "raw-shard", + "nbytes": 50331648, + "records": [ + { + "name": "model.layers.39.feed_forward.w2.q_weight", + "shape": [ + 6144, + 2048 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 50331648, + "byteOffset": 0 + } + ], + "md5sum": "08e0d3541b27e6e0aac96c6fbba8826a" + }, + { + "dataPath": "params_shard_187.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "model.layers.40.attention.wo.q_weight", + "shape": [ + 6144, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 18874368, + "byteOffset": 0 + } + ], + "md5sum": "81ca8b31e6c7e67cf7a94ce64753099b" + }, + { + "dataPath": "params_shard_188.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "model.layers.40.attention.wqkv.q_weight", + "shape": [ + 8192, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "c6eb99b73593a242a4a449193041a921" + }, + { + "dataPath": "params_shard_189.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.40.feed_forward.gate_up_proj.q_weight", + "shape": [ + 32768, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "f2cd3d7160965b9f6561e86558c5373a" + }, + { + "dataPath": "params_shard_190.bin", + "format": "raw-shard", + "nbytes": 24403968, + "records": [ + { + "name": "model.layers.39.feed_forward.gate_up_proj.q_scale", + "shape": [ + 32768, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.39.feed_forward.w2.q_scale", + "shape": [ + 6144, + 512 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 6291456, + "byteOffset": 12582912 + }, + { + "name": "model.layers.39.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 18874368 + }, + { + "name": "model.layers.40.attention.wo.q_scale", + "shape": [ + 6144, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 2359296, + "byteOffset": 18886656 + }, + { + "name": "model.layers.40.attention.wqkv.q_scale", + "shape": [ + 8192, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3145728, + "byteOffset": 21245952 + }, + { + "name": "model.layers.40.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 24391680 + } + ], + "md5sum": "46a45114942ac1536a5bfbbbb258edfe" + }, + { + "dataPath": "params_shard_191.bin", + "format": "raw-shard", + "nbytes": 50331648, + "records": [ + { + "name": "model.layers.40.feed_forward.w2.q_weight", + "shape": [ + 6144, + 2048 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 50331648, + "byteOffset": 0 + } + ], + "md5sum": "8d5c77f4235102f10fac0edffda3709f" + }, + { + "dataPath": "params_shard_192.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "model.layers.41.attention.wo.q_weight", + "shape": [ + 6144, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 18874368, + "byteOffset": 0 + } + ], + "md5sum": "fa4ab53f55f372541841f40b9e2a8cc5" + }, + { + "dataPath": "params_shard_193.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "model.layers.41.attention.wqkv.q_weight", + "shape": [ + 8192, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "b95b1f1845e488c54d88d517eab36217" + }, + { + "dataPath": "params_shard_194.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.41.feed_forward.gate_up_proj.q_weight", + "shape": [ + 32768, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "0e87a108ec599d27216e682a6c819421" + }, + { + "dataPath": "params_shard_195.bin", + "format": "raw-shard", + "nbytes": 24403968, + "records": [ + { + "name": "model.layers.40.feed_forward.gate_up_proj.q_scale", + "shape": [ + 32768, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.40.feed_forward.w2.q_scale", + "shape": [ + 6144, + 512 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 6291456, + "byteOffset": 12582912 + }, + { + "name": "model.layers.40.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 18874368 + }, + { + "name": "model.layers.41.attention.wo.q_scale", + "shape": [ + 6144, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 2359296, + "byteOffset": 18886656 + }, + { + "name": "model.layers.41.attention.wqkv.q_scale", + "shape": [ + 8192, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3145728, + "byteOffset": 21245952 + }, + { + "name": "model.layers.41.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 24391680 + } + ], + "md5sum": "810fbd5a022bc83f49588f0652187512" + }, + { + "dataPath": "params_shard_196.bin", + "format": "raw-shard", + "nbytes": 50331648, + "records": [ + { + "name": "model.layers.41.feed_forward.w2.q_weight", + "shape": [ + 6144, + 2048 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 50331648, + "byteOffset": 0 + } + ], + "md5sum": "7c96e0abf603520439cc06e66713527d" + }, + { + "dataPath": "params_shard_197.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "model.layers.42.attention.wo.q_weight", + "shape": [ + 6144, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 18874368, + "byteOffset": 0 + } + ], + "md5sum": "4cad6d7a1f0f0b6bbdbc63ad2ec9b19d" + }, + { + "dataPath": "params_shard_198.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "model.layers.42.attention.wqkv.q_weight", + "shape": [ + 8192, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "a01c4ec3d3566a6ee9b565733bf1d950" + }, + { + "dataPath": "params_shard_199.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.42.feed_forward.gate_up_proj.q_weight", + "shape": [ + 32768, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "ab36738df336067dd4ca9128c278df1e" + }, + { + "dataPath": "params_shard_200.bin", + "format": "raw-shard", + "nbytes": 24403968, + "records": [ + { + "name": "model.layers.41.feed_forward.gate_up_proj.q_scale", + "shape": [ + 32768, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.41.feed_forward.w2.q_scale", + "shape": [ + 6144, + 512 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 6291456, + "byteOffset": 12582912 + }, + { + "name": "model.layers.41.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 18874368 + }, + { + "name": "model.layers.42.attention.wo.q_scale", + "shape": [ + 6144, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 2359296, + "byteOffset": 18886656 + }, + { + "name": "model.layers.42.attention.wqkv.q_scale", + "shape": [ + 8192, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3145728, + "byteOffset": 21245952 + }, + { + "name": "model.layers.42.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 24391680 + } + ], + "md5sum": "a9ae49484edcb9c4c6f49dc1987a9569" + }, + { + "dataPath": "params_shard_201.bin", + "format": "raw-shard", + "nbytes": 50331648, + "records": [ + { + "name": "model.layers.42.feed_forward.w2.q_weight", + "shape": [ + 6144, + 2048 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 50331648, + "byteOffset": 0 + } + ], + "md5sum": "f15f494aa91d4630037100b7cc223816" + }, + { + "dataPath": "params_shard_202.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "model.layers.43.attention.wo.q_weight", + "shape": [ + 6144, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 18874368, + "byteOffset": 0 + } + ], + "md5sum": "bec4b8d962fd790d33b672bf28ade8f8" + }, + { + "dataPath": "params_shard_203.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "model.layers.43.attention.wqkv.q_weight", + "shape": [ + 8192, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "50fcebef2f22b3a70553d627748d7bde" + }, + { + "dataPath": "params_shard_204.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.43.feed_forward.gate_up_proj.q_weight", + "shape": [ + 32768, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "bc2cc08f2dafd46150c5e6fe11f557eb" + }, + { + "dataPath": "params_shard_205.bin", + "format": "raw-shard", + "nbytes": 24391680, + "records": [ + { + "name": "model.layers.42.feed_forward.gate_up_proj.q_scale", + "shape": [ + 32768, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.42.feed_forward.w2.q_scale", + "shape": [ + 6144, + 512 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 6291456, + "byteOffset": 12582912 + }, + { + "name": "model.layers.42.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 18874368 + }, + { + "name": "model.layers.43.attention.wo.q_scale", + "shape": [ + 6144, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 2359296, + "byteOffset": 18886656 + }, + { + "name": "model.layers.43.attention.wqkv.q_scale", + "shape": [ + 8192, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3145728, + "byteOffset": 21245952 + } + ], + "md5sum": "44c8668d170eb42a9bdc808fa40e4e3f" + }, + { + "dataPath": "params_shard_206.bin", + "format": "raw-shard", + "nbytes": 50331648, + "records": [ + { + "name": "model.layers.43.feed_forward.w2.q_weight", + "shape": [ + 6144, + 2048 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 50331648, + "byteOffset": 0 + } + ], + "md5sum": "bfb97d805c9de9cd897d1482fb7ac431" + }, + { + "dataPath": "params_shard_207.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "model.layers.44.attention.wo.q_weight", + "shape": [ + 6144, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 18874368, + "byteOffset": 0 + } + ], + "md5sum": "962e406c298e9a03b4b816bc98b6423f" + }, + { + "dataPath": "params_shard_208.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "model.layers.44.attention.wqkv.q_weight", + "shape": [ + 8192, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "fb5bae95e382db294d05491b63244046" + }, + { + "dataPath": "params_shard_209.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.44.feed_forward.gate_up_proj.q_weight", + "shape": [ + 32768, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "58b8076966f4cdd9833ea641a0aba4a9" + }, + { + "dataPath": "params_shard_210.bin", + "format": "raw-shard", + "nbytes": 24416256, + "records": [ + { + "name": "model.layers.43.feed_forward.gate_up_proj.q_scale", + "shape": [ + 32768, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.43.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 12582912 + }, + { + "name": "model.layers.43.feed_forward.w2.q_scale", + "shape": [ + 6144, + 512 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 6291456, + "byteOffset": 12595200 + }, + { + "name": "model.layers.43.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 18886656 + }, + { + "name": "model.layers.44.attention.wo.q_scale", + "shape": [ + 6144, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 2359296, + "byteOffset": 18898944 + }, + { + "name": "model.layers.44.attention.wqkv.q_scale", + "shape": [ + 8192, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3145728, + "byteOffset": 21258240 + }, + { + "name": "model.layers.44.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 24403968 + } + ], + "md5sum": "8cbf2ae05b0257047c056673f64aab40" + }, + { + "dataPath": "params_shard_211.bin", + "format": "raw-shard", + "nbytes": 50331648, + "records": [ + { + "name": "model.layers.44.feed_forward.w2.q_weight", + "shape": [ + 6144, + 2048 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 50331648, + "byteOffset": 0 + } + ], + "md5sum": "78c64985dd1e09e3d053e3da668a8f82" + }, + { + "dataPath": "params_shard_212.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "model.layers.45.attention.wo.q_weight", + "shape": [ + 6144, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 18874368, + "byteOffset": 0 + } + ], + "md5sum": "1ad65acda5fbb096cbce23821100d0c8" + }, + { + "dataPath": "params_shard_213.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "model.layers.45.attention.wqkv.q_weight", + "shape": [ + 8192, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "dfab68d1cbb76d655583d24c6b809c6c" + }, + { + "dataPath": "params_shard_214.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.45.feed_forward.gate_up_proj.q_weight", + "shape": [ + 32768, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "7f3125368c8e829120b04168d9446726" + }, + { + "dataPath": "params_shard_215.bin", + "format": "raw-shard", + "nbytes": 24403968, + "records": [ + { + "name": "model.layers.44.feed_forward.gate_up_proj.q_scale", + "shape": [ + 32768, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.44.feed_forward.w2.q_scale", + "shape": [ + 6144, + 512 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 6291456, + "byteOffset": 12582912 + }, + { + "name": "model.layers.44.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 18874368 + }, + { + "name": "model.layers.45.attention.wo.q_scale", + "shape": [ + 6144, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 2359296, + "byteOffset": 18886656 + }, + { + "name": "model.layers.45.attention.wqkv.q_scale", + "shape": [ + 8192, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3145728, + "byteOffset": 21245952 + }, + { + "name": "model.layers.45.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 24391680 + } + ], + "md5sum": "e93d197cf530def9dc0ccd25dee07f71" + }, + { + "dataPath": "params_shard_216.bin", + "format": "raw-shard", + "nbytes": 50331648, + "records": [ + { + "name": "model.layers.45.feed_forward.w2.q_weight", + "shape": [ + 6144, + 2048 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 50331648, + "byteOffset": 0 + } + ], + "md5sum": "2b9e842bf09a26e1031090aee3f33e78" + }, + { + "dataPath": "params_shard_217.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "model.layers.46.attention.wo.q_weight", + "shape": [ + 6144, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 18874368, + "byteOffset": 0 + } + ], + "md5sum": "89ce957b587abf7bcca0f5f54b7092ba" + }, + { + "dataPath": "params_shard_218.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "model.layers.46.attention.wqkv.q_weight", + "shape": [ + 8192, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "9429ed983670223155944d2a4a865031" + }, + { + "dataPath": "params_shard_219.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.46.feed_forward.gate_up_proj.q_weight", + "shape": [ + 32768, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "9d632c55535cdce5571ae9692a5e8f7a" + }, + { + "dataPath": "params_shard_220.bin", + "format": "raw-shard", + "nbytes": 24403968, + "records": [ + { + "name": "model.layers.45.feed_forward.gate_up_proj.q_scale", + "shape": [ + 32768, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.45.feed_forward.w2.q_scale", + "shape": [ + 6144, + 512 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 6291456, + "byteOffset": 12582912 + }, + { + "name": "model.layers.45.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 18874368 + }, + { + "name": "model.layers.46.attention.wo.q_scale", + "shape": [ + 6144, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 2359296, + "byteOffset": 18886656 + }, + { + "name": "model.layers.46.attention.wqkv.q_scale", + "shape": [ + 8192, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3145728, + "byteOffset": 21245952 + }, + { + "name": "model.layers.46.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 24391680 + } + ], + "md5sum": "be8fe44dfff8ad5da154c060124b5a27" + }, + { + "dataPath": "params_shard_221.bin", + "format": "raw-shard", + "nbytes": 50331648, + "records": [ + { + "name": "model.layers.46.feed_forward.w2.q_weight", + "shape": [ + 6144, + 2048 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 50331648, + "byteOffset": 0 + } + ], + "md5sum": "e73a84dba7df3edf3212aca4d43b892d" + }, + { + "dataPath": "params_shard_222.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "model.layers.47.attention.wo.q_weight", + "shape": [ + 6144, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 18874368, + "byteOffset": 0 + } + ], + "md5sum": "7a0791319f2cecc1731130321ccb01cb" + }, + { + "dataPath": "params_shard_223.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "model.layers.47.attention.wqkv.q_weight", + "shape": [ + 8192, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "5c3e84b69f0c7a3a63157560fa361b54" + }, + { + "dataPath": "params_shard_224.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.47.feed_forward.gate_up_proj.q_weight", + "shape": [ + 32768, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "67efaa8dc17af7cbe4a10922605975d6" + }, + { + "dataPath": "params_shard_225.bin", + "format": "raw-shard", + "nbytes": 24403968, + "records": [ + { + "name": "model.layers.46.feed_forward.gate_up_proj.q_scale", + "shape": [ + 32768, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.46.feed_forward.w2.q_scale", + "shape": [ + 6144, + 512 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 6291456, + "byteOffset": 12582912 + }, + { + "name": "model.layers.46.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 18874368 + }, + { + "name": "model.layers.47.attention.wo.q_scale", + "shape": [ + 6144, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 2359296, + "byteOffset": 18886656 + }, + { + "name": "model.layers.47.attention.wqkv.q_scale", + "shape": [ + 8192, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3145728, + "byteOffset": 21245952 + }, + { + "name": "model.layers.47.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 24391680 + } + ], + "md5sum": "ff36f2a1a4a79fd1edf4d84753c06fe1" + }, + { + "dataPath": "params_shard_226.bin", + "format": "raw-shard", + "nbytes": 50331648, + "records": [ + { + "name": "model.layers.47.feed_forward.w2.q_weight", + "shape": [ + 6144, + 2048 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 50331648, + "byteOffset": 0 + } + ], + "md5sum": "7b242ef01f8bc94265b14c88f4fb5a85" + }, + { + "dataPath": "params_shard_227.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "model.layers.6.attention.wo.q_weight", + "shape": [ + 6144, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 18874368, + "byteOffset": 0 + } + ], + "md5sum": "4096c8406ed4e677033af46ad337d0df" + }, + { + "dataPath": "params_shard_228.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "model.layers.6.attention.wqkv.q_weight", + "shape": [ + 8192, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "ed49904cb5632a1ebad2f2247c5d4fc8" + }, + { + "dataPath": "params_shard_229.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.6.feed_forward.gate_up_proj.q_weight", + "shape": [ + 32768, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "fc7e1357057d708152c38af23e367a85" + }, + { + "dataPath": "params_shard_230.bin", + "format": "raw-shard", + "nbytes": 24416256, + "records": [ + { + "name": "model.layers.47.feed_forward.gate_up_proj.q_scale", + "shape": [ + 32768, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.47.feed_forward.w2.q_scale", + "shape": [ + 6144, + 512 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 6291456, + "byteOffset": 12582912 + }, + { + "name": "model.layers.47.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 18874368 + }, + { + "name": "model.norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 18886656 + }, + { + "name": "model.layers.6.attention.wo.q_scale", + "shape": [ + 6144, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 2359296, + "byteOffset": 18898944 + }, + { + "name": "model.layers.6.attention.wqkv.q_scale", + "shape": [ + 8192, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3145728, + "byteOffset": 21258240 + }, + { + "name": "model.layers.6.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 24403968 + } + ], + "md5sum": "40c0dc0ccabfe5f1d9f78b726a360031" + }, + { + "dataPath": "params_shard_231.bin", + "format": "raw-shard", + "nbytes": 50331648, + "records": [ + { + "name": "model.layers.6.feed_forward.w2.q_weight", + "shape": [ + 6144, + 2048 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 50331648, + "byteOffset": 0 + } + ], + "md5sum": "cc7f3e7e05fdb6a0c73600ef94990adc" + }, + { + "dataPath": "params_shard_232.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "model.layers.7.attention.wo.q_weight", + "shape": [ + 6144, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 18874368, + "byteOffset": 0 + } + ], + "md5sum": "fde36954854070812585cb2c59d503ab" + }, + { + "dataPath": "params_shard_233.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "model.layers.7.attention.wqkv.q_weight", + "shape": [ + 8192, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "18a104c8923e0d56d349f11f43793f0f" + }, + { + "dataPath": "params_shard_234.bin", + "format": "raw-shard", + "nbytes": 100663296, + "records": [ + { + "name": "model.layers.7.feed_forward.gate_up_proj.q_weight", + "shape": [ + 32768, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 100663296, + "byteOffset": 0 + } + ], + "md5sum": "7864bfac4b3dc9bffd17fced37cf9be1" + }, + { + "dataPath": "params_shard_235.bin", + "format": "raw-shard", + "nbytes": 24403968, + "records": [ + { + "name": "model.layers.6.feed_forward.gate_up_proj.q_scale", + "shape": [ + 32768, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.6.feed_forward.w2.q_scale", + "shape": [ + 6144, + 512 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 6291456, + "byteOffset": 12582912 + }, + { + "name": "model.layers.6.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 18874368 + }, + { + "name": "model.layers.7.attention.wo.q_scale", + "shape": [ + 6144, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 2359296, + "byteOffset": 18886656 + }, + { + "name": "model.layers.7.attention.wqkv.q_scale", + "shape": [ + 8192, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3145728, + "byteOffset": 21245952 + }, + { + "name": "model.layers.7.attention_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 24391680 + } + ], + "md5sum": "fb98f5558e6c59c07776b7b225f736c8" + }, + { + "dataPath": "params_shard_236.bin", + "format": "raw-shard", + "nbytes": 50331648, + "records": [ + { + "name": "model.layers.7.feed_forward.w2.q_weight", + "shape": [ + 6144, + 2048 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 50331648, + "byteOffset": 0 + } + ], + "md5sum": "6facd90a35565420697823941fb45f41" + }, + { + "dataPath": "params_shard_237.bin", + "format": "raw-shard", + "nbytes": 18874368, + "records": [ + { + "name": "model.layers.8.attention.wo.q_weight", + "shape": [ + 6144, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 18874368, + "byteOffset": 0 + } + ], + "md5sum": "3ac01a84379a87490d93c3556016fc7c" + }, + { + "dataPath": "params_shard_238.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "model.layers.8.attention.wqkv.q_weight", + "shape": [ + 8192, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "fde46571de8b1829bf5efac03918bd9c" + }, + { + "dataPath": "params_shard_239.bin", + "format": "raw-shard", + "nbytes": 284295168, + "records": [ + { + "name": "output.q_weight", + "shape": [ + 92544, + 768 + ], + "dtype": "uint32", + "format": "f32-to-bf16", + "nbytes": 284295168, + "byteOffset": 0 + } + ], + "md5sum": "55f61b9267d7e0afbe4a1198dbd3d3b0" + }, + { + "dataPath": "params_shard_240.bin", + "format": "raw-shard", + "nbytes": 35536896, + "records": [ + { + "name": "output.q_scale", + "shape": [ + 92544, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 35536896, + "byteOffset": 0 + } + ], + "md5sum": "89f25a89c637723b976edcd9b8abe8bc" + }, + { + "dataPath": "params_shard_241.bin", + "format": "raw-shard", + "nbytes": 24391680, + "records": [ + { + "name": "model.layers.7.feed_forward.gate_up_proj.q_scale", + "shape": [ + 32768, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12582912, + "byteOffset": 0 + }, + { + "name": "model.layers.7.feed_forward.w2.q_scale", + "shape": [ + 6144, + 512 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 6291456, + "byteOffset": 12582912 + }, + { + "name": "model.layers.7.ffn_norm.weight", + "shape": [ + 6144 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 12288, + "byteOffset": 18874368 + }, + { + "name": "model.layers.8.attention.wo.q_scale", + "shape": [ + 6144, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 2359296, + "byteOffset": 18886656 + }, + { + "name": "model.layers.8.attention.wqkv.q_scale", + "shape": [ + 8192, + 192 + ], + "dtype": "float16", + "format": "f32-to-bf16", + "nbytes": 3145728, + "byteOffset": 21245952 + } + ], + "md5sum": "4be47898516de3750155af2c09274973" + } + ] +} \ No newline at end of file diff --git a/params_shard_0.bin b/params_shard_0.bin new file mode 100644 index 0000000000000000000000000000000000000000..01722807c930fe672727cab71f9123f50fe91fab --- /dev/null +++ b/params_shard_0.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fb0459e58dece47c2eae86e89b5c9d6093f53bbc23af86d4f8cbbbafaa65bca +size 25165824 diff --git a/params_shard_1.bin b/params_shard_1.bin new file mode 100644 index 0000000000000000000000000000000000000000..39042bbeb2c32d268ee841f0901aadb17fb9c306 --- /dev/null +++ b/params_shard_1.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed20162e3ef0a7967a153e48cbde61693174e98cab7eec3824e2159fe51cdc25 +size 100663296 diff --git a/params_shard_10.bin b/params_shard_10.bin new file mode 100644 index 0000000000000000000000000000000000000000..21674bd2b80d3b45cce782a224e66ff06f7a5e51 --- /dev/null +++ b/params_shard_10.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce116e62e71f191ae9464a1ae4d2c148ce3b70fb1b23dd59201767cf3a76d9c7 +size 50331648 diff --git a/params_shard_100.bin b/params_shard_100.bin new file mode 100644 index 0000000000000000000000000000000000000000..b62b88931772096538c8ac3644d7657f86565017 --- /dev/null +++ b/params_shard_100.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54d8bb5e07db69f05b4959f0f4596958f7e5714e408867e12edad099329fc7b1 +size 50331648 diff --git a/params_shard_101.bin b/params_shard_101.bin new file mode 100644 index 0000000000000000000000000000000000000000..6a9238d737f3ccdab63d9cc31e3af9e40e837235 --- /dev/null +++ b/params_shard_101.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4de4276d4a3f42ccf399b54e2b17c76e27a5c2e2df0402247de620751f975983 +size 18874368 diff --git a/params_shard_102.bin b/params_shard_102.bin new file mode 100644 index 0000000000000000000000000000000000000000..2ccaa20ee8594c10c4b0aaaad09fe49b997c0789 --- /dev/null +++ b/params_shard_102.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e33e921aee8bdb5f2186fad2b4b36b9d298d05dd88193f3ff18824cb3d7fd2a +size 25165824 diff --git a/params_shard_103.bin b/params_shard_103.bin new file mode 100644 index 0000000000000000000000000000000000000000..6fdae7050aacc5880f95d1b2ac29f1f8d0116bf6 --- /dev/null +++ b/params_shard_103.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:430e42665ee8f1378b26fb48cf7c3a975cb05345c733a1eab0155bee1b8d4050 +size 100663296 diff --git a/params_shard_104.bin b/params_shard_104.bin new file mode 100644 index 0000000000000000000000000000000000000000..a0f3bc19330ac08c1c6dacfec1ade96daa012131 --- /dev/null +++ b/params_shard_104.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5081ab36d448bd96924040a5d458076de979c2b64d5ddb8717c15ce5e24ff0d8 +size 24403968 diff --git a/params_shard_105.bin b/params_shard_105.bin new file mode 100644 index 0000000000000000000000000000000000000000..acbb8a1799d49c29dede9b791ba1c31ad15416c9 --- /dev/null +++ b/params_shard_105.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32692de128ccf1ab9a0b2fbc03aa997855065f291af2f75e8e48dcc1456b2948 +size 50331648 diff --git a/params_shard_106.bin b/params_shard_106.bin new file mode 100644 index 0000000000000000000000000000000000000000..9415fa77843c5daf5e1c1b9c5a2e5020b79b0b42 --- /dev/null +++ b/params_shard_106.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27004edad5ac50c850306b8aae0ef60f89d21a70ff8084e23018108f4c67a445 +size 18874368 diff --git a/params_shard_107.bin b/params_shard_107.bin new file mode 100644 index 0000000000000000000000000000000000000000..1218390124bc6d676b333a4d6eef18ca4a4f23f4 --- /dev/null +++ b/params_shard_107.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02750ac4f497014b655fa7cc67b35fa21b3ad3830c54457dd4bb53aae62765ff +size 25165824 diff --git a/params_shard_108.bin b/params_shard_108.bin new file mode 100644 index 0000000000000000000000000000000000000000..ba3d7174b49e828204cee0d5e9e25582e662b372 --- /dev/null +++ b/params_shard_108.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0eadf592956661531deedc6f945df6d9c7a75293c4f0011b643fea2075312e7 +size 100663296 diff --git a/params_shard_109.bin b/params_shard_109.bin new file mode 100644 index 0000000000000000000000000000000000000000..4a17c1880dfd312620abd2756c95045a6ac9e76e --- /dev/null +++ b/params_shard_109.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:919093fdcdfffb45242687326612590b8f0ae27a43bdae5fbaf8f2dc5bf57d7f +size 24403968 diff --git a/params_shard_11.bin b/params_shard_11.bin new file mode 100644 index 0000000000000000000000000000000000000000..44f52cf82aa37cdcd684c72b9d817371a06c815b --- /dev/null +++ b/params_shard_11.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c932e5027e751fa3721242055cde985f41b1df5d24e2b76d6af7c8406950a86 +size 18874368 diff --git a/params_shard_110.bin b/params_shard_110.bin new file mode 100644 index 0000000000000000000000000000000000000000..8865481687f72180ca93c0d4fc2c70479911c29f --- /dev/null +++ b/params_shard_110.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84207ce3e8c1db8bf5ead72e38588837ff1322b3da514f70475a9d4394b9c888 +size 50331648 diff --git a/params_shard_111.bin b/params_shard_111.bin new file mode 100644 index 0000000000000000000000000000000000000000..99fa2bbc99a0bbe58e5c47a31c253bcb3dc6a467 --- /dev/null +++ b/params_shard_111.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:916f1ee6527e9158ddd6005f5b639d16965fd8f894ca6e098e3d228da5d8d494 +size 18874368 diff --git a/params_shard_112.bin b/params_shard_112.bin new file mode 100644 index 0000000000000000000000000000000000000000..2c79677f6247f4d7337372c0b16d7cd59e7a23ff --- /dev/null +++ b/params_shard_112.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7628d7790272d26681fd8b9fef103d0aaf7f4111254761ae44feb562ad4648d0 +size 25165824 diff --git a/params_shard_113.bin b/params_shard_113.bin new file mode 100644 index 0000000000000000000000000000000000000000..5b8a55ce8af919ecfa202cc3aafbb0e7353b2978 --- /dev/null +++ b/params_shard_113.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a69b7f89725dc0227880d56c9324758782418254f6318c3de391a719d990da7 +size 100663296 diff --git a/params_shard_114.bin b/params_shard_114.bin new file mode 100644 index 0000000000000000000000000000000000000000..c52eb368d9588a04d06e50c5204c478d260e1e00 --- /dev/null +++ b/params_shard_114.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5dbc16808b62e736080760b355cac4800f2190665a9e3ca211f43f2bf8ccc6a5 +size 24403968 diff --git a/params_shard_115.bin b/params_shard_115.bin new file mode 100644 index 0000000000000000000000000000000000000000..a512f253aad25e13ff1d751cc7c2adc39af22f18 --- /dev/null +++ b/params_shard_115.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23f4b7cdf6f82cf74b949e0f2f5a57b4c9de98d9673ede148f3d0a5211fb48fd +size 50331648 diff --git a/params_shard_116.bin b/params_shard_116.bin new file mode 100644 index 0000000000000000000000000000000000000000..080278308f5dbf5d80e22142147625995116329b --- /dev/null +++ b/params_shard_116.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0909bf1247336b3ada15d6888a91f6aeadedb910d83b45fb6477f348fef15bdd +size 18874368 diff --git a/params_shard_117.bin b/params_shard_117.bin new file mode 100644 index 0000000000000000000000000000000000000000..7500e10894026eafede486bf8d06381f934e43b6 --- /dev/null +++ b/params_shard_117.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3059064d0a76be5dd9a74da7b7078e51e9c4eef2424dcc7ce2b2285fb72ed051 +size 25165824 diff --git a/params_shard_118.bin b/params_shard_118.bin new file mode 100644 index 0000000000000000000000000000000000000000..7eca14da4f0e439df305930a20eb2ba87b95102e --- /dev/null +++ b/params_shard_118.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f5e3826ca03f5ce46440319a368c09f55ae90c05079eb38437c6775e13e950b +size 100663296 diff --git a/params_shard_119.bin b/params_shard_119.bin new file mode 100644 index 0000000000000000000000000000000000000000..050e040524bcdac544d46306aa0a857880ac6cc7 --- /dev/null +++ b/params_shard_119.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fa1dc9f305fa4f0036deb2b425af0e98d40403bdcc13b4b58a30ea9b0eab394 +size 24391680 diff --git a/params_shard_12.bin b/params_shard_12.bin new file mode 100644 index 0000000000000000000000000000000000000000..36bd0e55222f7ea279e827be4dc9b257d2d117c9 --- /dev/null +++ b/params_shard_12.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9ab4de3a6d6accdb9825e81b41836e625cef07d55bc714cfa246d4ce42417a8 +size 25165824 diff --git a/params_shard_120.bin b/params_shard_120.bin new file mode 100644 index 0000000000000000000000000000000000000000..7ab95c511d85a45a65144354343981fd66982c35 --- /dev/null +++ b/params_shard_120.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:226cc4f8a9b2c74e0180cb0333bf6db660d181d9c8cd02e8e2c69968e9eb7176 +size 50331648 diff --git a/params_shard_121.bin b/params_shard_121.bin new file mode 100644 index 0000000000000000000000000000000000000000..2c227714f962a51cd63faf4f300af3558f17cede --- /dev/null +++ b/params_shard_121.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1ff3c496fa9a5475bec22f996c9457da4d47b47ffba2287ff44b9c098271029 +size 18874368 diff --git a/params_shard_122.bin b/params_shard_122.bin new file mode 100644 index 0000000000000000000000000000000000000000..299715d7f74341556e7097584d67c4423c2ad177 --- /dev/null +++ b/params_shard_122.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df0f25082d204d69684b07bc9a4d86c25845aa24148265f458484f2c3f303182 +size 25165824 diff --git a/params_shard_123.bin b/params_shard_123.bin new file mode 100644 index 0000000000000000000000000000000000000000..4a6ba85d159a9396ca250e88c51ca693424b6c89 --- /dev/null +++ b/params_shard_123.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47e2b61c89318d9b3a850b5ced9a9166260a4bf428145b09a853dcffa44dd4fa +size 100663296 diff --git a/params_shard_124.bin b/params_shard_124.bin new file mode 100644 index 0000000000000000000000000000000000000000..deca4acb77f95644f2e8422549f048dc64904ee7 --- /dev/null +++ b/params_shard_124.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a1c5e5082c1a4f60aad606d898fa6d82ca649f222a7275a7bab55f47cd957eb +size 24416256 diff --git a/params_shard_125.bin b/params_shard_125.bin new file mode 100644 index 0000000000000000000000000000000000000000..8999491d0800d5f79c85116fd1b57861187fa720 --- /dev/null +++ b/params_shard_125.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c19420c27e2f2f2879782d3950d909e0ff2eff9c90ce155dcf8215054c29d319 +size 50331648 diff --git a/params_shard_126.bin b/params_shard_126.bin new file mode 100644 index 0000000000000000000000000000000000000000..bd83f63ec433600231ce2863be2b581d15afc8bf --- /dev/null +++ b/params_shard_126.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b31f63e6ecb9b6e822dc4c0b11dfa10df51d0e3cddb3e535204b2d305049173 +size 18874368 diff --git a/params_shard_127.bin b/params_shard_127.bin new file mode 100644 index 0000000000000000000000000000000000000000..11835c81928c1f6f8f81fe5d73dd9e53d7271f49 --- /dev/null +++ b/params_shard_127.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5065324e1ed81d1e169a3f8b603cfe60ad5940ebed9cd44c16be5f1db5279833 +size 25165824 diff --git a/params_shard_128.bin b/params_shard_128.bin new file mode 100644 index 0000000000000000000000000000000000000000..f57f5ae8bfe50931aa0785c31c9502f9fe0f65c1 --- /dev/null +++ b/params_shard_128.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3174bb0732f5de52291b8bdd4309827dcefa4efc68fb69e190b34dfa9e8e93f2 +size 100663296 diff --git a/params_shard_129.bin b/params_shard_129.bin new file mode 100644 index 0000000000000000000000000000000000000000..3f3647d16aa0a6fe7f9cdf616e18a476f39c84ab --- /dev/null +++ b/params_shard_129.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55ca1a58d23899a5c5932d0f086af7020da0cc13785f5ae5cc9075deae192695 +size 24403968 diff --git a/params_shard_13.bin b/params_shard_13.bin new file mode 100644 index 0000000000000000000000000000000000000000..29a52bd16f8d8474adebe78acc9f2c18f7af19a0 --- /dev/null +++ b/params_shard_13.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e033d99a4a19bb59e22510b5d085035a0d887e8ef08bfd34e776889c5ce42bae +size 100663296 diff --git a/params_shard_130.bin b/params_shard_130.bin new file mode 100644 index 0000000000000000000000000000000000000000..196836a1d1b593229fe7e99a29da651ee80d407b --- /dev/null +++ b/params_shard_130.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85bbc4c55804a4d310ff540c5af694acb137058e62d16e7bccff886f1948cef1 +size 50331648 diff --git a/params_shard_131.bin b/params_shard_131.bin new file mode 100644 index 0000000000000000000000000000000000000000..18a12cefe02a0eb8d4da941bd27ccb56dece6b93 --- /dev/null +++ b/params_shard_131.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1361fb250b07d8a03c0ecfb1a878f73ed88e96963337c2c344efdcdfaabe9921 +size 50331648 diff --git a/params_shard_132.bin b/params_shard_132.bin new file mode 100644 index 0000000000000000000000000000000000000000..a8718e0e760d9f23626f59e01512ab701d89b425 --- /dev/null +++ b/params_shard_132.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d379b0966746c20b1ab0e42d6aa4e1360351cb1200e176ade307081739685d9c +size 18874368 diff --git a/params_shard_133.bin b/params_shard_133.bin new file mode 100644 index 0000000000000000000000000000000000000000..d1166de08c7c92cef9084986b6fbc38b79b79c1c --- /dev/null +++ b/params_shard_133.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7c40783d16b8ee678fc4149f03119157a96d6b53e480f1da4ea64466390d842 +size 25165824 diff --git a/params_shard_134.bin b/params_shard_134.bin new file mode 100644 index 0000000000000000000000000000000000000000..b24e6e9deccfc842ebabaac6811e421044eb737b --- /dev/null +++ b/params_shard_134.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41bc0a64e2def945c9ca3c07b820e1368d1f095132732ca1de6f98880ce6c08d +size 100663296 diff --git a/params_shard_135.bin b/params_shard_135.bin new file mode 100644 index 0000000000000000000000000000000000000000..c6bc02041407cf2e7c0b600ebebfc23a993c29f0 --- /dev/null +++ b/params_shard_135.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:533fb1ce2f2df585a96ef18709e4c930954e9b0c34bf979a733e113761b49134 +size 30720000 diff --git a/params_shard_136.bin b/params_shard_136.bin new file mode 100644 index 0000000000000000000000000000000000000000..ac876b05febb4eeeafe3df747f6a4c537a1e79fd --- /dev/null +++ b/params_shard_136.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b1d0177a822b70058573882a5002f322f1bc3ba7f105b1a2e18e06f3faa54e7 +size 50331648 diff --git a/params_shard_137.bin b/params_shard_137.bin new file mode 100644 index 0000000000000000000000000000000000000000..0b5a24eaa1de8b7fc4fd3741b1296556c51419a5 --- /dev/null +++ b/params_shard_137.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:005868a312d6a1e0ace755cd352cf8abc20e95c963dd9b2337c4ae14325473fe +size 18874368 diff --git a/params_shard_138.bin b/params_shard_138.bin new file mode 100644 index 0000000000000000000000000000000000000000..acdcc7861362130c0df4187a73070682c9ba12b3 --- /dev/null +++ b/params_shard_138.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5b8b8f572c480c28d5e987a3d889612d1435f3c38b9cdbd153ec92e6541498c +size 25165824 diff --git a/params_shard_139.bin b/params_shard_139.bin new file mode 100644 index 0000000000000000000000000000000000000000..6c59ac35b6021da4004035013bfe5c009458cebe --- /dev/null +++ b/params_shard_139.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfbf12fd4a949f10745c16d2455fec00c156aa6b2f02a3667ab7e6ac08a3a871 +size 100663296 diff --git a/params_shard_14.bin b/params_shard_14.bin new file mode 100644 index 0000000000000000000000000000000000000000..aef1195bfd034ca244e01d3dde9c4c8a20848dbc --- /dev/null +++ b/params_shard_14.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:804e13ebaaeb3015c825bc79adb71b55bda6e9f25c6a92265f8a1de71c5c1c30 +size 24403968 diff --git a/params_shard_140.bin b/params_shard_140.bin new file mode 100644 index 0000000000000000000000000000000000000000..e937ed4e14f01be1c904da892fce7fab6eb3928b --- /dev/null +++ b/params_shard_140.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b59629f07d9bfd19b95165a57709a2784b97b59a547dfb69d9c091f6c51897dc +size 24403968 diff --git a/params_shard_141.bin b/params_shard_141.bin new file mode 100644 index 0000000000000000000000000000000000000000..63cff365e636392ddd0a8effe129c469a6284490 --- /dev/null +++ b/params_shard_141.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69eea7bdc01321dabdfe30ebe296eafa59090ed2aaed7ac89527a5c61dcedc34 +size 50331648 diff --git a/params_shard_142.bin b/params_shard_142.bin new file mode 100644 index 0000000000000000000000000000000000000000..c8b4f616e6a190890eec96f448b8073ffb43a8ee --- /dev/null +++ b/params_shard_142.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7582d42f80b706d7c426734f4a4ad96dac05bb14ec0d084150fbf529a00b979 +size 18874368 diff --git a/params_shard_143.bin b/params_shard_143.bin new file mode 100644 index 0000000000000000000000000000000000000000..917091ef8cab605128a27d836841315db205ad2b --- /dev/null +++ b/params_shard_143.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e4f1c823deed632ca41b889308f307e69ffd5d6606081928c97c9ade805fd15 +size 25165824 diff --git a/params_shard_144.bin b/params_shard_144.bin new file mode 100644 index 0000000000000000000000000000000000000000..ded1c64a45e4c8767fdfb19eb1d19d400146bdbd --- /dev/null +++ b/params_shard_144.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:705c2ccb1c85726602deb696ce0d33f7b68af75248be941044f18ad9f717e9ef +size 100663296 diff --git a/params_shard_145.bin b/params_shard_145.bin new file mode 100644 index 0000000000000000000000000000000000000000..f0219859216925bb2843fbc374b1d617da87738f --- /dev/null +++ b/params_shard_145.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce0a93b2546f74bcd315c5957da56f1e7c598405e2da015532bfcd6237b9e68b +size 24403968 diff --git a/params_shard_146.bin b/params_shard_146.bin new file mode 100644 index 0000000000000000000000000000000000000000..de0bf4f03d99a19f7bce542d46cd71cb90d8e84c --- /dev/null +++ b/params_shard_146.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f7bfff29a63994c5899c947b64505a5864d9e2f2cfa10e88e8c8497cda6f4a2 +size 50331648 diff --git a/params_shard_147.bin b/params_shard_147.bin new file mode 100644 index 0000000000000000000000000000000000000000..a068d9936356d7988c0582b6b36790f0ebbaa295 --- /dev/null +++ b/params_shard_147.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12ccf8545d85b235b9a8f84e977f44b13a499fa80038cc985adb4715dccb3cbb +size 18874368 diff --git a/params_shard_148.bin b/params_shard_148.bin new file mode 100644 index 0000000000000000000000000000000000000000..f09a5f8b42bad5b06b03fe2eb8adb8837ee9d529 --- /dev/null +++ b/params_shard_148.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0e693e07aa48164b4a929951532e904ec67dda0423da8f3cb3a9222eb1e778a +size 25165824 diff --git a/params_shard_149.bin b/params_shard_149.bin new file mode 100644 index 0000000000000000000000000000000000000000..cb283eb4a2a7b60991d6f95fb1c75e15a4460edf --- /dev/null +++ b/params_shard_149.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00ca47f59a0c0c424b44fde92b1ffad1c7f6b6041673286db0f0edb5088e98e4 +size 100663296 diff --git a/params_shard_15.bin b/params_shard_15.bin new file mode 100644 index 0000000000000000000000000000000000000000..6df279487f2b71c93f524217ec7a8e0529f77a8f --- /dev/null +++ b/params_shard_15.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20fbc1d55a90070de1a1d3064dbf22e48fd3c2de5fe32157778a86143e1754eb +size 50331648 diff --git a/params_shard_150.bin b/params_shard_150.bin new file mode 100644 index 0000000000000000000000000000000000000000..2ab5f4626f23103a819f5770234ea7172dc16af6 --- /dev/null +++ b/params_shard_150.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7296b5b4dcfc05304ad8ca47f41fa8d2b55bd7a441bde09ca37f509bce99d754 +size 24403968 diff --git a/params_shard_151.bin b/params_shard_151.bin new file mode 100644 index 0000000000000000000000000000000000000000..412f5e218343a45629f04c739bb1edf8413bec86 --- /dev/null +++ b/params_shard_151.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8be12be1775b56d833a54ba7347dc5413708a24190f22688e12768098a2786d1 +size 50331648 diff --git a/params_shard_152.bin b/params_shard_152.bin new file mode 100644 index 0000000000000000000000000000000000000000..76fabf0aa2e981289d3ac11da96cd93babdf8cc9 --- /dev/null +++ b/params_shard_152.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6f1bddd7a6eb2c75b8bd92d32a82506f05771c20478b326b8a54e75826bb0cc +size 18874368 diff --git a/params_shard_153.bin b/params_shard_153.bin new file mode 100644 index 0000000000000000000000000000000000000000..32740f73170708b5216e3c4081f42361d4e027dd --- /dev/null +++ b/params_shard_153.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:998aa9ad5b1b7d095dfc0e557748991f931312775a8a74c5e23e6425411e8652 +size 25165824 diff --git a/params_shard_154.bin b/params_shard_154.bin new file mode 100644 index 0000000000000000000000000000000000000000..71e2e02a57466e6a405e84e86640c7f218c10456 --- /dev/null +++ b/params_shard_154.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4b8587bb27539d5477c94faedbfe63d99ac8a02f21d7240a579753dd9b69d2c +size 100663296 diff --git a/params_shard_155.bin b/params_shard_155.bin new file mode 100644 index 0000000000000000000000000000000000000000..4b5fa02bd384be6ac47008c91d11600966e6f575 --- /dev/null +++ b/params_shard_155.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d9427ff8262e1dcadcf2731e7fd269fb742f33f8eb44af98f717cc37a27075e +size 24391680 diff --git a/params_shard_156.bin b/params_shard_156.bin new file mode 100644 index 0000000000000000000000000000000000000000..7de0b8de97a005f4892a1662b5ce295082609119 --- /dev/null +++ b/params_shard_156.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f977e35e979990508707756a6b266a9d8bccf0a22ecd7b7d9ee4e2a6b94fb02 +size 50331648 diff --git a/params_shard_157.bin b/params_shard_157.bin new file mode 100644 index 0000000000000000000000000000000000000000..76f36d41c446d54d569b84fd98c62316dfd24bc1 --- /dev/null +++ b/params_shard_157.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34480045ba2c4af7658f88fff564150b97dbea41f6251d57a94e0e6bd8632b0c +size 18874368 diff --git a/params_shard_158.bin b/params_shard_158.bin new file mode 100644 index 0000000000000000000000000000000000000000..14d4667b7263cc5ed1a70026c0edbd2e46fbcd78 --- /dev/null +++ b/params_shard_158.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22eff38864259e453fa65f79d37e03c227e71732d021e4b643847aed90548d8e +size 25165824 diff --git a/params_shard_159.bin b/params_shard_159.bin new file mode 100644 index 0000000000000000000000000000000000000000..423406659df003ef0415acbf555968be0b38a966 --- /dev/null +++ b/params_shard_159.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9cb41dd3d81d62769cb6b123c05ad3449423b63df2818d21d1e91837bb5a5f9 +size 100663296 diff --git a/params_shard_16.bin b/params_shard_16.bin new file mode 100644 index 0000000000000000000000000000000000000000..ad80f03ae386dc7238463d08d67086f88c775505 --- /dev/null +++ b/params_shard_16.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5211e53f8ee4db9dcd6268fcf48b3328e6b70ea92918ede635b9237afabb6d4d +size 18874368 diff --git a/params_shard_160.bin b/params_shard_160.bin new file mode 100644 index 0000000000000000000000000000000000000000..4a7c89d1f92dd09118b0d6448454e7ff6c7ec974 --- /dev/null +++ b/params_shard_160.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b132219562a78f09f8afffac00505ed06a893eefbbf34e3d8c1c4cf34a59abd +size 24416256 diff --git a/params_shard_161.bin b/params_shard_161.bin new file mode 100644 index 0000000000000000000000000000000000000000..065339f1dded5fb98b0849f9b91bb925ddb8981b --- /dev/null +++ b/params_shard_161.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e0857c1393335e288b4258ec66b0f5c78bf84789a8b217539f4408c10601cd7 +size 50331648 diff --git a/params_shard_162.bin b/params_shard_162.bin new file mode 100644 index 0000000000000000000000000000000000000000..367a817acbbcbefbd3684289e18ba29cad8532f5 --- /dev/null +++ b/params_shard_162.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f2f61a16c356119f9b0f56834cdf75dfa6feda91c9d9e3b6ac070586c0da195 +size 18874368 diff --git a/params_shard_163.bin b/params_shard_163.bin new file mode 100644 index 0000000000000000000000000000000000000000..d4d8f39f38161db049f5dbffe3c60f8adf911a2f --- /dev/null +++ b/params_shard_163.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c38ed31361be35cabaeb0382335ed08fe49b50a29b5145dc74ecc02e27806b1e +size 25165824 diff --git a/params_shard_164.bin b/params_shard_164.bin new file mode 100644 index 0000000000000000000000000000000000000000..e143dc744d61bbcae3b5c59eb50a9991129e671e --- /dev/null +++ b/params_shard_164.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b88ad61c441a369d3e66ecf822880ee65eca580d21e0c086414216c9fbf96f9 +size 100663296 diff --git a/params_shard_165.bin b/params_shard_165.bin new file mode 100644 index 0000000000000000000000000000000000000000..82d7eb9519857beca8bc0013965a2a45d4e6aa64 --- /dev/null +++ b/params_shard_165.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e13597da972aa034a745b7afd2de7bfb4ba71aa44d35f4c998b7b634435df78d +size 24403968 diff --git a/params_shard_166.bin b/params_shard_166.bin new file mode 100644 index 0000000000000000000000000000000000000000..160afdb49dd92ff4efac45a5fb6e595805e4eec2 --- /dev/null +++ b/params_shard_166.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b1aa75f08ca3854fa97693fcfe1de787eace7841f3cfeac1dc57f671dcf4978 +size 50331648 diff --git a/params_shard_167.bin b/params_shard_167.bin new file mode 100644 index 0000000000000000000000000000000000000000..09fe1fe78e47ed54034dae562030e06c25ef5594 --- /dev/null +++ b/params_shard_167.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f54c74f0c6855ddbf45e9d7e358d46f1a155b8ee2c3817614120aa57e92735c2 +size 18874368 diff --git a/params_shard_168.bin b/params_shard_168.bin new file mode 100644 index 0000000000000000000000000000000000000000..d9db6f6c1a872fe70228bf9de6ce8eac79dae3b9 --- /dev/null +++ b/params_shard_168.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f98b213ed5d5dbd35d78fad8a450fa885c8ae5e1333d9a3d933430b2c1930c33 +size 25165824 diff --git a/params_shard_169.bin b/params_shard_169.bin new file mode 100644 index 0000000000000000000000000000000000000000..0b16129e32c5fa641bc332568ecf89266697ebd5 --- /dev/null +++ b/params_shard_169.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c4d5641a1a5463e2e135cf90cc470bdcffa7e5a1f392c48fb9d847ebab3add7 +size 100663296 diff --git a/params_shard_17.bin b/params_shard_17.bin new file mode 100644 index 0000000000000000000000000000000000000000..dfb70a169ab85acdb879990e1855113d09a09cd6 --- /dev/null +++ b/params_shard_17.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5dbcd449798e222f8877ca019ab1db4ddff6d23fc868cc9bfae85486e3a9f089 +size 25165824 diff --git a/params_shard_170.bin b/params_shard_170.bin new file mode 100644 index 0000000000000000000000000000000000000000..00f16b6ffeb0339b49133f4fb4d503f1ecc00a22 --- /dev/null +++ b/params_shard_170.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66787413a1ce72e88b871201cd6d26833df186d742d9a9813249cd3d4b32750b +size 24403968 diff --git a/params_shard_171.bin b/params_shard_171.bin new file mode 100644 index 0000000000000000000000000000000000000000..2c23503c64484413d88e3b8359fb7ee0456a5d72 --- /dev/null +++ b/params_shard_171.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8263cafa082e63e114dc58d0e111db1db9702bc086f41fa43109668f17989cbd +size 50331648 diff --git a/params_shard_172.bin b/params_shard_172.bin new file mode 100644 index 0000000000000000000000000000000000000000..25a0a5464a18e394bfe4ecc61e7adf071c5916c1 --- /dev/null +++ b/params_shard_172.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a16ec86f3bf226b2e76de079edcec5a7fbf8ecfa41133cd4f6893fcb82059599 +size 18874368 diff --git a/params_shard_173.bin b/params_shard_173.bin new file mode 100644 index 0000000000000000000000000000000000000000..bd2c2a64f9411e7d6586d74fb3eab408ae0ccb8c --- /dev/null +++ b/params_shard_173.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2a215d18ca548613304673e00e1c0aca4de1248a69d387935eabab85983a298 +size 25165824 diff --git a/params_shard_174.bin b/params_shard_174.bin new file mode 100644 index 0000000000000000000000000000000000000000..20734b6b36035ac059a276b0a7850f0a8504ce15 --- /dev/null +++ b/params_shard_174.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:860ac7b299a81f109a2953b25afcf16883c966d9b748a737901c10f7d16f4f1d +size 100663296 diff --git a/params_shard_175.bin b/params_shard_175.bin new file mode 100644 index 0000000000000000000000000000000000000000..b67188fae2900ff679f841b2cab50e897ed3e602 --- /dev/null +++ b/params_shard_175.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79c0b32f7f3dd8d9e8442751e539c2218d921445325c3e15da939b0a0d6dd269 +size 24403968 diff --git a/params_shard_176.bin b/params_shard_176.bin new file mode 100644 index 0000000000000000000000000000000000000000..b65b603f3be2b4898d6db7085fc097e7d3bc9121 --- /dev/null +++ b/params_shard_176.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39b5563cb4e3e954be17c79ef899e2938ebf1b12824ff66e18372ca534d16603 +size 50331648 diff --git a/params_shard_177.bin b/params_shard_177.bin new file mode 100644 index 0000000000000000000000000000000000000000..905d455079d08ca41636951964d2fb68941f46a2 --- /dev/null +++ b/params_shard_177.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ded56721b3f51d41c66460659602746a1942304efc76528362c3dd134257becf +size 18874368 diff --git a/params_shard_178.bin b/params_shard_178.bin new file mode 100644 index 0000000000000000000000000000000000000000..0494453aa827c005bd23302a126fb17d620da560 --- /dev/null +++ b/params_shard_178.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d17b98d5ac91f8c57705ae79062224055e0229de8c640c580a0305522999dd62 +size 25165824 diff --git a/params_shard_179.bin b/params_shard_179.bin new file mode 100644 index 0000000000000000000000000000000000000000..fb015eefca496cbff24067fafc5061bc93c9bf0b --- /dev/null +++ b/params_shard_179.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a572613a335f1c6ef553b3f3c9f36857acef63185366d6e811a09147f2ec523e +size 100663296 diff --git a/params_shard_18.bin b/params_shard_18.bin new file mode 100644 index 0000000000000000000000000000000000000000..e0108d92c9dd0fc262cf70419071ae9d804d1e6d --- /dev/null +++ b/params_shard_18.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bbf7a285fc4b82e0995a618fb125f94d3b899373d1f1178b754e7c0365b2471 +size 100663296 diff --git a/params_shard_180.bin b/params_shard_180.bin new file mode 100644 index 0000000000000000000000000000000000000000..ad496fae31596b4ef637a98f7541e6f0245b090c --- /dev/null +++ b/params_shard_180.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7efc51751e3090a3ad2f58ff8f9a8b59daf805a99af91c3730f83c753b9d4c8 +size 24391680 diff --git a/params_shard_181.bin b/params_shard_181.bin new file mode 100644 index 0000000000000000000000000000000000000000..c8cff343f25b6e49e00df285840451ad1f936ecd --- /dev/null +++ b/params_shard_181.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3eb82d04602f42fba5e519e1da83dfa9606fae09439ce6c1adeacbe5d065073 +size 50331648 diff --git a/params_shard_182.bin b/params_shard_182.bin new file mode 100644 index 0000000000000000000000000000000000000000..6f5e1cbf209f09130d2e2130575f54c96cc57bc5 --- /dev/null +++ b/params_shard_182.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef7b46608e199d82621dc9707bf00af8cf8f7dd23e7533e988c49f316224af14 +size 18874368 diff --git a/params_shard_183.bin b/params_shard_183.bin new file mode 100644 index 0000000000000000000000000000000000000000..1a1be91bc1339f3161514fef4ba9fb60a8a74b28 --- /dev/null +++ b/params_shard_183.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:579e93cf45e136618aa19919c8d6fd1ee78d00eb48b38cdccefb5ad113749d32 +size 25165824 diff --git a/params_shard_184.bin b/params_shard_184.bin new file mode 100644 index 0000000000000000000000000000000000000000..3a69746e9f46fe05abd91f0c43955313801bd1ea --- /dev/null +++ b/params_shard_184.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45d962aeb49ab4610e473e9a86302865d309c6641ab05d72134575c6cdd311da +size 100663296 diff --git a/params_shard_185.bin b/params_shard_185.bin new file mode 100644 index 0000000000000000000000000000000000000000..3910e68b6528e1ecb90c3887f244c8f5d30569e7 --- /dev/null +++ b/params_shard_185.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b04cdc2d45719538e9ae411d06170e9cd3854ac0837e2bb09491e4521c975b2 +size 24416256 diff --git a/params_shard_186.bin b/params_shard_186.bin new file mode 100644 index 0000000000000000000000000000000000000000..56ccfd959a3a1d53e9f3202cabe678cf428babba --- /dev/null +++ b/params_shard_186.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0babcec18fa657e51cfaf04c9014a5cb095cd189cc77143a118797112d2734b3 +size 50331648 diff --git a/params_shard_187.bin b/params_shard_187.bin new file mode 100644 index 0000000000000000000000000000000000000000..609520d6c76f8eef9bc117dcc68a2d3608195d43 --- /dev/null +++ b/params_shard_187.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f6b4bdfcea581002f60af713b339476d0f808b34a7016e7f6df7a97599e0dc9 +size 18874368 diff --git a/params_shard_188.bin b/params_shard_188.bin new file mode 100644 index 0000000000000000000000000000000000000000..1c883ae5f0360bd6fb9c8621cd34cbfb94dc158e --- /dev/null +++ b/params_shard_188.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d4a1cae445775058acfd61c11df90c8174b3361cbf1192990ad6ca8ddedcdec +size 25165824 diff --git a/params_shard_189.bin b/params_shard_189.bin new file mode 100644 index 0000000000000000000000000000000000000000..7681f6520c0ea8adec6c160eabe3d14a3971e97c --- /dev/null +++ b/params_shard_189.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d29b236b95b480cb060a29a43b819f6f97e6be0723e79e49adaf3eb8ded8f141 +size 100663296 diff --git a/params_shard_19.bin b/params_shard_19.bin new file mode 100644 index 0000000000000000000000000000000000000000..0e65086db9a95ea37930666958a0cf1e51aebdd9 --- /dev/null +++ b/params_shard_19.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd9a0c00fc256cb59eaff313340ceaa127fed18f09e7a5c5369c778b85d62fe9 +size 24391680 diff --git a/params_shard_190.bin b/params_shard_190.bin new file mode 100644 index 0000000000000000000000000000000000000000..e554b91d64c199a602536253443bc1da4a10a729 --- /dev/null +++ b/params_shard_190.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5b29ad11640d8e742ca533d8dd0fc5c3d7bec67c93cbbe4e3537a22662a696b +size 24403968 diff --git a/params_shard_191.bin b/params_shard_191.bin new file mode 100644 index 0000000000000000000000000000000000000000..511fbbdc3cf20f4b4dae95b12425d3ff506aaf3c --- /dev/null +++ b/params_shard_191.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16704de327723cf5942051684c13796662f454f8759db7c37682ba0ada3e1f3f +size 50331648 diff --git a/params_shard_192.bin b/params_shard_192.bin new file mode 100644 index 0000000000000000000000000000000000000000..a22b5985d24d27d9eac656a67c05a164c57d76b0 --- /dev/null +++ b/params_shard_192.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a44eec01b4a8638b41f2a3bf31816081031463d4a6e0c713cb783cda1c50e46d +size 18874368 diff --git a/params_shard_193.bin b/params_shard_193.bin new file mode 100644 index 0000000000000000000000000000000000000000..636c50b19b3520d847ec759903406d9cd0180867 --- /dev/null +++ b/params_shard_193.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62960b76a9af5f849325106987710051ddaa734ed95d36f31034f5a83d72b773 +size 25165824 diff --git a/params_shard_194.bin b/params_shard_194.bin new file mode 100644 index 0000000000000000000000000000000000000000..cd3a23bd7b7619ee3aa4d6bbf3b63b1ac078bafb --- /dev/null +++ b/params_shard_194.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1dc6c61434c551365e8d968cd164d3d6fbefe1c0f598dfdd55a01cea7c8cba9f +size 100663296 diff --git a/params_shard_195.bin b/params_shard_195.bin new file mode 100644 index 0000000000000000000000000000000000000000..8837f4a12c42fa795dc961fbc921d87fc4105fb2 --- /dev/null +++ b/params_shard_195.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fda65e0483b614f1b059dd4b065e7cf547303470497650d0d6ec02e8b1b3438 +size 24403968 diff --git a/params_shard_196.bin b/params_shard_196.bin new file mode 100644 index 0000000000000000000000000000000000000000..f06b97cffcfdea1586e1b6d85dbb2f4d35312250 --- /dev/null +++ b/params_shard_196.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69b0a970fa3fe98f97621ea046b0cd91bd1483912593a470bfa564ebfea6bddf +size 50331648 diff --git a/params_shard_197.bin b/params_shard_197.bin new file mode 100644 index 0000000000000000000000000000000000000000..baa679ee54e5da6c413fafbf780a1cebd96fca99 --- /dev/null +++ b/params_shard_197.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3afb2e2c338b3472878b62ca6d61bf58f9ce650712413adff6e13a8be6b6608 +size 18874368 diff --git a/params_shard_198.bin b/params_shard_198.bin new file mode 100644 index 0000000000000000000000000000000000000000..cf47cd72dc49d94cbdecf42211b26d72f4121529 --- /dev/null +++ b/params_shard_198.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bea2876b2ae5c14aafbefe510c68f71e7d774c72d73e3565ba8b6abe8c29699 +size 25165824 diff --git a/params_shard_199.bin b/params_shard_199.bin new file mode 100644 index 0000000000000000000000000000000000000000..c7289e0ff8b1258856032620d1384929ca9d93f6 --- /dev/null +++ b/params_shard_199.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a70097128809b0f426bb0b6928d69a745cf6396c6cbfd938a54ed25d4c641cb +size 100663296 diff --git a/params_shard_2.bin b/params_shard_2.bin new file mode 100644 index 0000000000000000000000000000000000000000..055d86e0def985e656d6253002f0d59a5da9318a --- /dev/null +++ b/params_shard_2.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6af07edbfe5dedecada880efa0c29d1df3216e9c5c6747b9f51196322f49ffaa +size 24391680 diff --git a/params_shard_20.bin b/params_shard_20.bin new file mode 100644 index 0000000000000000000000000000000000000000..3a31c491958ea23e6b51666e060827406b0508dc --- /dev/null +++ b/params_shard_20.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51573eb3ae66a78da20a6d64d0a4e400f8ab1971e8dd743763855e893c5aed6d +size 31457280 diff --git a/params_shard_200.bin b/params_shard_200.bin new file mode 100644 index 0000000000000000000000000000000000000000..3c5d14e471d5d9990d93243eb5d30e415c92183b --- /dev/null +++ b/params_shard_200.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c8c7fd8d6d78e3860279ed933e7ddb44fef2a813f1b5ee3f7a69a1861ccbe74 +size 24403968 diff --git a/params_shard_201.bin b/params_shard_201.bin new file mode 100644 index 0000000000000000000000000000000000000000..0fc4aa4001eb46a3ef5534bb0cf389bead191aef --- /dev/null +++ b/params_shard_201.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5625ef7fdd6955047b302fb7b0cd9b14e114bc3c2bfa07e4b5503217f1dd1106 +size 50331648 diff --git a/params_shard_202.bin b/params_shard_202.bin new file mode 100644 index 0000000000000000000000000000000000000000..a991c7e70b26e2d39b256db67434c688fe76ef10 --- /dev/null +++ b/params_shard_202.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1332e059138c746d0a654389b8b1d7997baf80dd0df12f5417d603f9b84b415 +size 18874368 diff --git a/params_shard_203.bin b/params_shard_203.bin new file mode 100644 index 0000000000000000000000000000000000000000..75135f58cd1306a91789b644c227b78f0e6dc5f4 --- /dev/null +++ b/params_shard_203.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ca548f82d04fc5976991cfc2916b7f716c7e7d3dea1fd9e5014114d255da727 +size 25165824 diff --git a/params_shard_204.bin b/params_shard_204.bin new file mode 100644 index 0000000000000000000000000000000000000000..5508d193677dc9ca276c05303af18c1c45314866 --- /dev/null +++ b/params_shard_204.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69ff8789b770589319de7e8d3ef930c72a75ec6431984d1d755fea33cf29719a +size 100663296 diff --git a/params_shard_205.bin b/params_shard_205.bin new file mode 100644 index 0000000000000000000000000000000000000000..31eb266a5aed6a8b46fd78cd19142ca44719d74f --- /dev/null +++ b/params_shard_205.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e323d7230ac0b3480d4060d468f9ec352b483221844fa268c3db967c52184716 +size 24391680 diff --git a/params_shard_206.bin b/params_shard_206.bin new file mode 100644 index 0000000000000000000000000000000000000000..d110ac3e526e3759f8b4c6ffaaafa8711f9279b8 --- /dev/null +++ b/params_shard_206.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6624482dcb4594da49bc89af2c58256bae7536d66aaec65266c5200c27c9c262 +size 50331648 diff --git a/params_shard_207.bin b/params_shard_207.bin new file mode 100644 index 0000000000000000000000000000000000000000..2812a2264300cc15aa0062447448974214611b64 --- /dev/null +++ b/params_shard_207.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b6300adb5c86515d35a255ff27a2568cd34a6b143dbe7e2c5d86a48ca8618f1 +size 18874368 diff --git a/params_shard_208.bin b/params_shard_208.bin new file mode 100644 index 0000000000000000000000000000000000000000..93944770afeb835d9030b2e30a5fbbce8b9d276b --- /dev/null +++ b/params_shard_208.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6076b71722db0defb683fe1fb85ed5f338566215b0d447589a5f7aef98ee2f4 +size 25165824 diff --git a/params_shard_209.bin b/params_shard_209.bin new file mode 100644 index 0000000000000000000000000000000000000000..1ecade66d370852ac41a3fac3a2a56297b5df288 --- /dev/null +++ b/params_shard_209.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e8ab762da83e24b16478a71028a6afe29086544166f5d23be5fb9cbee73c5ff +size 100663296 diff --git a/params_shard_21.bin b/params_shard_21.bin new file mode 100644 index 0000000000000000000000000000000000000000..541c8c298bb870043d573d75d35619fd5504234f --- /dev/null +++ b/params_shard_21.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bf9b10f793380b6df5e6c496af780419d9713be3f01dc9676bff68ed87c89f3 +size 100663296 diff --git a/params_shard_210.bin b/params_shard_210.bin new file mode 100644 index 0000000000000000000000000000000000000000..40d827e379d2accc71906dfa79bdae475ace8fd1 --- /dev/null +++ b/params_shard_210.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b14755dff44131d0fa46515ed00a1149a6f67b5e7a1d8b951c0b53ca8f4c9a33 +size 24416256 diff --git a/params_shard_211.bin b/params_shard_211.bin new file mode 100644 index 0000000000000000000000000000000000000000..fc737cf7517d32aa04349b4b54877351f9360f4e --- /dev/null +++ b/params_shard_211.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c8b6849c173eeefc8c8e1ce2f9820edad216f05db075c93a443215ffc806deb +size 50331648 diff --git a/params_shard_212.bin b/params_shard_212.bin new file mode 100644 index 0000000000000000000000000000000000000000..3375657c50f160df4241cf9f32faa83403ede665 --- /dev/null +++ b/params_shard_212.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a4ebd36240476fae927b48bcdfda9db524d26464b3e61edf41ee463fccce7d2 +size 18874368 diff --git a/params_shard_213.bin b/params_shard_213.bin new file mode 100644 index 0000000000000000000000000000000000000000..98668b81ec2426a1b7fc43553644bd15b1ce3c88 --- /dev/null +++ b/params_shard_213.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:149c6cf83aec5335591143f900f4819f71199c6568b1306affd42ca6c87f6ebe +size 25165824 diff --git a/params_shard_214.bin b/params_shard_214.bin new file mode 100644 index 0000000000000000000000000000000000000000..766648ea91a59a86fa3c35cb2f6744c58f8aa4dc --- /dev/null +++ b/params_shard_214.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3fa0350db8ed14890cee15ba40fd8d862d11d57753fb3643e021e18ba0934f8 +size 100663296 diff --git a/params_shard_215.bin b/params_shard_215.bin new file mode 100644 index 0000000000000000000000000000000000000000..27fd39296fade6fe444dff9efe3130610ebad473 --- /dev/null +++ b/params_shard_215.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2291597649a87c1d5273d24da127155e18d3f48089b41b8daa555373002c17aa +size 24403968 diff --git a/params_shard_216.bin b/params_shard_216.bin new file mode 100644 index 0000000000000000000000000000000000000000..2c5b7d7ffc749b154dd3c00c264abb69e15c481c --- /dev/null +++ b/params_shard_216.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35c1127ee7d2c65539b8f4db763efbd3e464e61b394d5354c7290c6e729c83ad +size 50331648 diff --git a/params_shard_217.bin b/params_shard_217.bin new file mode 100644 index 0000000000000000000000000000000000000000..162486cfaf39643334d1c08b1a449e58fda288d6 --- /dev/null +++ b/params_shard_217.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f32587005965f583f51c0ed308cf5aba53f69a60dd74c4508277b692b4ba31e2 +size 18874368 diff --git a/params_shard_218.bin b/params_shard_218.bin new file mode 100644 index 0000000000000000000000000000000000000000..004104fbd5074951f9eb37e9d492bfb5f0829d6f --- /dev/null +++ b/params_shard_218.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5f922ea49e375907bb2b5b8842206b22520c9cc8027be9e1df7afb2c913e1ab +size 25165824 diff --git a/params_shard_219.bin b/params_shard_219.bin new file mode 100644 index 0000000000000000000000000000000000000000..721803e68e0c059098586607a0d7ceef8b20d889 --- /dev/null +++ b/params_shard_219.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31ca48c669f5a46d74e9f81de05ad31825f76975dfbbe5ed173701d8a8993d4b +size 100663296 diff --git a/params_shard_22.bin b/params_shard_22.bin new file mode 100644 index 0000000000000000000000000000000000000000..4e6d009efb7df6f773d746c5d4e0848eef883275 --- /dev/null +++ b/params_shard_22.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aaab9e1aa1f3c4c106cf58308ba4529148f1d0d850f9ab018f7ab81970e5cca6 +size 30683136 diff --git a/params_shard_220.bin b/params_shard_220.bin new file mode 100644 index 0000000000000000000000000000000000000000..df415ab8f162f171027d2f98541ae0bfa4566b78 --- /dev/null +++ b/params_shard_220.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33c4d7afc95a4aec4548e304ed06146d4c19dd94653a0273cd70375e8a6991c6 +size 24403968 diff --git a/params_shard_221.bin b/params_shard_221.bin new file mode 100644 index 0000000000000000000000000000000000000000..d783cabd2c41e415d05c0eeb25a00f4af408a9a4 --- /dev/null +++ b/params_shard_221.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f11d06890f2a3606090a7977963958d86b80da3f5992529d8290e784f2d15a5e +size 50331648 diff --git a/params_shard_222.bin b/params_shard_222.bin new file mode 100644 index 0000000000000000000000000000000000000000..6849e87d249106bf59b05336e5e2fc42ecf5bf6a --- /dev/null +++ b/params_shard_222.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55743cd2c3c3fb2c388a4cba73b2567aa859bc8031ce07592123a09ec8071fa6 +size 18874368 diff --git a/params_shard_223.bin b/params_shard_223.bin new file mode 100644 index 0000000000000000000000000000000000000000..ab0e3f2f11489440d662d05a337f5aae220b42a1 --- /dev/null +++ b/params_shard_223.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11e0e3b8fcdb6228ec0efef6aa65e0bc05eae59164d1d77d3f38cb85b52a03fa +size 25165824 diff --git a/params_shard_224.bin b/params_shard_224.bin new file mode 100644 index 0000000000000000000000000000000000000000..c4071c4e48d17e0a8db6d0ad03ca97a4f654c503 --- /dev/null +++ b/params_shard_224.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fd1b18d31b36681a56fe00f8fcfdc08055b1f36abf14dfabffa97716f6732b7 +size 100663296 diff --git a/params_shard_225.bin b/params_shard_225.bin new file mode 100644 index 0000000000000000000000000000000000000000..232536c7e84f5455eba73d950b61395b6a6c3ad6 --- /dev/null +++ b/params_shard_225.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69ba0f92e0bcf42720e58efa33de842b184b098cf26bdea3a207f9410c669f98 +size 24403968 diff --git a/params_shard_226.bin b/params_shard_226.bin new file mode 100644 index 0000000000000000000000000000000000000000..e4d255186fae38c7f83c6f6535d0ad030689029b --- /dev/null +++ b/params_shard_226.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fb2b4333eb723829296bcf6ead8f77b22dc4aefbe7d4a3ea1f0f7ad048ddf56 +size 50331648 diff --git a/params_shard_227.bin b/params_shard_227.bin new file mode 100644 index 0000000000000000000000000000000000000000..7f02504102423c1c2b9257711255cf28791b4e1e --- /dev/null +++ b/params_shard_227.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8295fff7e523b063178353e112262f23025c7dc8d57e2e7be7495aa1210654f +size 18874368 diff --git a/params_shard_228.bin b/params_shard_228.bin new file mode 100644 index 0000000000000000000000000000000000000000..f56ffd7323946b99292f00fb05e256b0fbc6f39d --- /dev/null +++ b/params_shard_228.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08220df4bf3bc1b25667047422d3d690238ac5c32a3102a7777685c825a33bf6 +size 25165824 diff --git a/params_shard_229.bin b/params_shard_229.bin new file mode 100644 index 0000000000000000000000000000000000000000..14c117fee6e13273a6e601769e1651859efc1710 --- /dev/null +++ b/params_shard_229.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8361a55c1ff1ddb5dc4cd5cf9ddd282252ea1e6488ef62f7e70821e265fc40ac +size 100663296 diff --git a/params_shard_23.bin b/params_shard_23.bin new file mode 100644 index 0000000000000000000000000000000000000000..bd699db77070b02a948491cc8c0403bd72c2b0a3 --- /dev/null +++ b/params_shard_23.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:addc4614b98d2d366923a1e2df115b7068d2773922dbe3dc88eff3cf03c38600 +size 50331648 diff --git a/params_shard_230.bin b/params_shard_230.bin new file mode 100644 index 0000000000000000000000000000000000000000..f6296db5674a14a5cb05faccc8fa5e9b7d45e52c --- /dev/null +++ b/params_shard_230.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e9c20de9fe291f8aae75958fa073bbf4f26ad95cf45581f6206e1aba197e155 +size 24416256 diff --git a/params_shard_231.bin b/params_shard_231.bin new file mode 100644 index 0000000000000000000000000000000000000000..b890223442b267e6c1e0064d541ba64c3f5622d7 --- /dev/null +++ b/params_shard_231.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a0bd9404fb14b4bcb23c3e690676988cf5d9930f180144dcf909dcea31a9e49 +size 50331648 diff --git a/params_shard_232.bin b/params_shard_232.bin new file mode 100644 index 0000000000000000000000000000000000000000..2d9f7ece838abf1a7515b0d53171a15f3589d1e5 --- /dev/null +++ b/params_shard_232.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c645c0a79b360ae8c34f50b21c63e7261a73a0093e51b8c3c5cd868999dfbcbf +size 18874368 diff --git a/params_shard_233.bin b/params_shard_233.bin new file mode 100644 index 0000000000000000000000000000000000000000..78f1caa6890202237b3edc86e6bccdd082f8fef6 --- /dev/null +++ b/params_shard_233.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8cb81780aeeec36afe7fd09ee6203de6fd46c762cf216c057cfb09206717f1f +size 25165824 diff --git a/params_shard_234.bin b/params_shard_234.bin new file mode 100644 index 0000000000000000000000000000000000000000..880d0ae2ec9702e1f00dd72f049cf862a24c2790 --- /dev/null +++ b/params_shard_234.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e7b5d859fb0d5ed2cf2a642751eb76a025ccc4961a166140e967ccd2c508b93 +size 100663296 diff --git a/params_shard_235.bin b/params_shard_235.bin new file mode 100644 index 0000000000000000000000000000000000000000..02863ff8a1722c13993be4cb36edcab271161043 --- /dev/null +++ b/params_shard_235.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e707f9cc17cb4ef233e88fd13b7ccc5a23d5f95fa0a425eafa141ece839ffde6 +size 24403968 diff --git a/params_shard_236.bin b/params_shard_236.bin new file mode 100644 index 0000000000000000000000000000000000000000..89220a07cb4373f99eed4bcd16c553960703ad5c --- /dev/null +++ b/params_shard_236.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8be17d94873a6f37692f223c0d09ac04983e539397c12f0ddb714802e78ef6f9 +size 50331648 diff --git a/params_shard_237.bin b/params_shard_237.bin new file mode 100644 index 0000000000000000000000000000000000000000..d318a0b6a5a8c0cb50fed5ceb98ab32b7725e305 --- /dev/null +++ b/params_shard_237.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8be1f01497b0c8eccf6e1e5d16ee949393c10ba277261ddefeb6c44f7dfa4191 +size 18874368 diff --git a/params_shard_238.bin b/params_shard_238.bin new file mode 100644 index 0000000000000000000000000000000000000000..591913881dffcda24577229d5feab1907be3f0c7 --- /dev/null +++ b/params_shard_238.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b7d3ce5efa217ada44e95032f05fbc51d26e4ba517a1a04721e15e41f56bb0a +size 25165824 diff --git a/params_shard_239.bin b/params_shard_239.bin new file mode 100644 index 0000000000000000000000000000000000000000..c438bc113c0fbdc4a4facf8c17d902a4b174bd5b --- /dev/null +++ b/params_shard_239.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:435cf3d7e9522e76407b9f03ce5ad1f337bdcbb78dae515029fa9d3878d8081e +size 284295168 diff --git a/params_shard_24.bin b/params_shard_24.bin new file mode 100644 index 0000000000000000000000000000000000000000..c9326f6235d4683ba0ec8348cf0f2176dd0ecf3f --- /dev/null +++ b/params_shard_24.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9999783424ce9df95c1b8b919657fca12e5da1499b43e3ded4ac8261d28ce385 +size 50331648 diff --git a/params_shard_240.bin b/params_shard_240.bin new file mode 100644 index 0000000000000000000000000000000000000000..d2cb798b408688ffaace892de4a5aa19e54721d9 --- /dev/null +++ b/params_shard_240.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:691f05eff0dd37a06fede44f1c09fc99a74dbc6ef1e63e15e2901a564e076bf1 +size 35536896 diff --git a/params_shard_241.bin b/params_shard_241.bin new file mode 100644 index 0000000000000000000000000000000000000000..e1e45573fa2105c153fa6c1f4e04d9c1e7e3f17b --- /dev/null +++ b/params_shard_241.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57ff218caa8c0c812f90ddcf50b9d00ecc2dc2383818e2575cb4ee8a1844026b +size 24391680 diff --git a/params_shard_25.bin b/params_shard_25.bin new file mode 100644 index 0000000000000000000000000000000000000000..245b56f572f00214120150550c7a4772d87b71ce --- /dev/null +++ b/params_shard_25.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6423d72765c75b95f2a6d3e605d381e6df1aafa1c98c1d0eba17ae060df1f55 +size 100663296 diff --git a/params_shard_26.bin b/params_shard_26.bin new file mode 100644 index 0000000000000000000000000000000000000000..aa3e6b40402778a0e71a9c8d16f999dc8d234b90 --- /dev/null +++ b/params_shard_26.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:addb1c05e5de944b6680904de10a3d1e84ed50e85f92f6c19c067b3665d59c5d +size 25190400 diff --git a/params_shard_27.bin b/params_shard_27.bin new file mode 100644 index 0000000000000000000000000000000000000000..f5f2ea45fdadc0e95a580af284f928c1ad12af85 --- /dev/null +++ b/params_shard_27.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e752303c1b7fc6e57e5f4e46a13dec09141ddf03eb092070f5dd696126403386 +size 31469568 diff --git a/params_shard_28.bin b/params_shard_28.bin new file mode 100644 index 0000000000000000000000000000000000000000..d0f816636cb6cdabe3215cc47bf0e76a2aea70b1 --- /dev/null +++ b/params_shard_28.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:844ddb97555c6d86a9a401884e7292035d1843a3b1478e83a4b2d080c6f56599 +size 100663296 diff --git a/params_shard_29.bin b/params_shard_29.bin new file mode 100644 index 0000000000000000000000000000000000000000..4caab79b3fdf9e1ab8699ce26eb09510662be042 --- /dev/null +++ b/params_shard_29.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4263d388738f86431b5b6da99f8577aa034c2ea90754b05f5ebb3cc0586a103 +size 30683136 diff --git a/params_shard_3.bin b/params_shard_3.bin new file mode 100644 index 0000000000000000000000000000000000000000..a04aef595df4f6f4473dd2e0391b7bb969a3ef13 --- /dev/null +++ b/params_shard_3.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51adf07ea66268de765211731c1d3b09596b2093ff90bc3917d78a0932dee6f9 +size 50331648 diff --git a/params_shard_30.bin b/params_shard_30.bin new file mode 100644 index 0000000000000000000000000000000000000000..ba20ce91446c7dcf197bcb3598d9b4a3216652bb --- /dev/null +++ b/params_shard_30.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14416637cf54252d9bdc5eb5e758868567ac907ac648f6f84768b802d42f2263 +size 50331648 diff --git a/params_shard_31.bin b/params_shard_31.bin new file mode 100644 index 0000000000000000000000000000000000000000..f30d2fcc6c50b2191eb12f5ce70c36801276664b --- /dev/null +++ b/params_shard_31.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0a246648d37ee264263b9ab378d8a2094f5570edad037d600a30d5e9ecf3200 +size 18874368 diff --git a/params_shard_32.bin b/params_shard_32.bin new file mode 100644 index 0000000000000000000000000000000000000000..893ab829cdb5c53a37f5eead2d3105fb1bc2bace --- /dev/null +++ b/params_shard_32.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b17435e9cf5e6a89d120c558931003a4a037a0281c0cf27ddb6df8ff18897ba +size 25165824 diff --git a/params_shard_33.bin b/params_shard_33.bin new file mode 100644 index 0000000000000000000000000000000000000000..400811313c012425b7952415860e58ae1690119d --- /dev/null +++ b/params_shard_33.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dad725f4ec810e09193f4c4e30333e8fb8c585655329b423515dbc22043111ef +size 100663296 diff --git a/params_shard_34.bin b/params_shard_34.bin new file mode 100644 index 0000000000000000000000000000000000000000..99bc5e67bf97c28101832e38ab244a16d5ce0fd7 --- /dev/null +++ b/params_shard_34.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6d6240678332c5d45b069c8b60187894aba0f2d73d9aec436d2f6097d0d8699 +size 24403968 diff --git a/params_shard_35.bin b/params_shard_35.bin new file mode 100644 index 0000000000000000000000000000000000000000..f07bc96afcfd939e69444bfdb233d9ecac70fa35 --- /dev/null +++ b/params_shard_35.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:231040b1e3299acf843c58a1fb2ebc2f19544c46a6c8239609bdeaa60ae219d1 +size 50331648 diff --git a/params_shard_36.bin b/params_shard_36.bin new file mode 100644 index 0000000000000000000000000000000000000000..c5ee0b8c686519af94d3f4c6513755fd8f86a526 --- /dev/null +++ b/params_shard_36.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e77cf718a7c89191a40b92cc2bfe9211bdea409030da3982293b7d3d62bd7bd2 +size 18874368 diff --git a/params_shard_37.bin b/params_shard_37.bin new file mode 100644 index 0000000000000000000000000000000000000000..a48bd5bc6f18f9fbc0149ad3a110f635b128cc79 --- /dev/null +++ b/params_shard_37.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c5cef25f2df3ac81ce2ef4b99ebf4ca6ae1829eb535195024b15748f22f7850 +size 25165824 diff --git a/params_shard_38.bin b/params_shard_38.bin new file mode 100644 index 0000000000000000000000000000000000000000..f07997b3e2dd3656e045b99c6222c27f325429d3 --- /dev/null +++ b/params_shard_38.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d12cbfb5adbd6df8b24bbcac995075f292883b65d85e545bd38aa5f1c74e4407 +size 100663296 diff --git a/params_shard_39.bin b/params_shard_39.bin new file mode 100644 index 0000000000000000000000000000000000000000..b995d8a64074cc5eabf0db0805e9a17d9fd03b7f --- /dev/null +++ b/params_shard_39.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:665e0e5d1b7af259a28066837d9a71aa8a639f770f46fa3f6e7fc8334c3ac41c +size 24403968 diff --git a/params_shard_4.bin b/params_shard_4.bin new file mode 100644 index 0000000000000000000000000000000000000000..5cca0c6c1597ff3c695e6575efd0791bcc1e54f7 --- /dev/null +++ b/params_shard_4.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeec58b696da1ae77a8ac4e1dc7e96362e6a807d7f88fa331da5f087a1fbf31f +size 284295168 diff --git a/params_shard_40.bin b/params_shard_40.bin new file mode 100644 index 0000000000000000000000000000000000000000..571ac30d924809e05cba2e32b2d005c074ec5f79 --- /dev/null +++ b/params_shard_40.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9e9ca340df06bfefb5e6b0ec10c27a4262a98bf112d8309924633f7968f284b +size 50331648 diff --git a/params_shard_41.bin b/params_shard_41.bin new file mode 100644 index 0000000000000000000000000000000000000000..674731bed333c9a17e4d34c4d4d63d33b097dbf8 --- /dev/null +++ b/params_shard_41.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c311a9843cf03aafbf67bac6b4657c5458577b38ba72b3449603c563de95793 +size 18874368 diff --git a/params_shard_42.bin b/params_shard_42.bin new file mode 100644 index 0000000000000000000000000000000000000000..dbf62965afc9148dd5cae69aebc38a1ecec2678c --- /dev/null +++ b/params_shard_42.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcf6a9699640be0456399fd5e7666395cedf4cabd7d65faf21c5545e3514cf10 +size 25165824 diff --git a/params_shard_43.bin b/params_shard_43.bin new file mode 100644 index 0000000000000000000000000000000000000000..f223161bb60dd64ba692a7ce16ee32f4ddcb215c --- /dev/null +++ b/params_shard_43.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9e3fd899b0ad133f6a18195d68f2ec8522bca37340f6a7f85348d840077fe82 +size 100663296 diff --git a/params_shard_44.bin b/params_shard_44.bin new file mode 100644 index 0000000000000000000000000000000000000000..0e8f549abe995114666dadbff8b481e6cde92e8c --- /dev/null +++ b/params_shard_44.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c656a4f4b58430574faaa82521321f8a5a97510543e22fdaec1140814b84460d +size 24391680 diff --git a/params_shard_45.bin b/params_shard_45.bin new file mode 100644 index 0000000000000000000000000000000000000000..c659f02dd885809985473f2d3da58a92b05023df --- /dev/null +++ b/params_shard_45.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36d62647c386b58b58b9655c43f3860a6a431788b498abafa9b0f0fb70e27841 +size 50331648 diff --git a/params_shard_46.bin b/params_shard_46.bin new file mode 100644 index 0000000000000000000000000000000000000000..8a908e81a2349c49f04f1c6110d67abe10f6ec82 --- /dev/null +++ b/params_shard_46.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27df742b93d22ec12d9f295b397db5552147d0e808ffc702fbe47d002761133c +size 18874368 diff --git a/params_shard_47.bin b/params_shard_47.bin new file mode 100644 index 0000000000000000000000000000000000000000..306443b6401e8699a27f39dfa23a2ed0dd2cd055 --- /dev/null +++ b/params_shard_47.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6464da3693560974057d06e81474df7b831a66cd692bb93246f5d8fb007a4f5c +size 25165824 diff --git a/params_shard_48.bin b/params_shard_48.bin new file mode 100644 index 0000000000000000000000000000000000000000..0e291f0e8671865bd610ff24ee243cae3954a1d8 --- /dev/null +++ b/params_shard_48.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0445c397fb2e2805a4b427c9c703e04f24baccae1979a74887e9a9bc617d153 +size 100663296 diff --git a/params_shard_49.bin b/params_shard_49.bin new file mode 100644 index 0000000000000000000000000000000000000000..ab210d26c6519d24fd3ecc8fa3bc41cc94b0f68b --- /dev/null +++ b/params_shard_49.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:792f9d2df6eb49b3bf8b72881ca3d2654f5cec7aca78e764b9189c229f7a9e9f +size 24416256 diff --git a/params_shard_5.bin b/params_shard_5.bin new file mode 100644 index 0000000000000000000000000000000000000000..2284c0894c9e6698b56cec4c4f27af2c85ea6760 --- /dev/null +++ b/params_shard_5.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25857e97783cca471551874e2508273e08585dd12ac5672b0719f886f01dc598 +size 35536896 diff --git a/params_shard_50.bin b/params_shard_50.bin new file mode 100644 index 0000000000000000000000000000000000000000..6ff5dc742b0a428a211efc1f109f3489757efcf0 --- /dev/null +++ b/params_shard_50.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86b7f17f0b7f8bed8ce0d8e4806d80e61bd6e5e1f80c9bcdf9aa1ba601c842f3 +size 50331648 diff --git a/params_shard_51.bin b/params_shard_51.bin new file mode 100644 index 0000000000000000000000000000000000000000..5e8e79957bc37b942abf816651a2bdbe22f50a3c --- /dev/null +++ b/params_shard_51.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1af3e6350bd27080c91a130bf87af86032c4bf0d6bb533fc9c6d6c030537a41 +size 18874368 diff --git a/params_shard_52.bin b/params_shard_52.bin new file mode 100644 index 0000000000000000000000000000000000000000..0abcf28c129f076cb38169a512dcaa1d3c91aabc --- /dev/null +++ b/params_shard_52.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac0a50e653d49a86ae349cbcbccf2697910f36572187be3ca7e013325b658324 +size 25165824 diff --git a/params_shard_53.bin b/params_shard_53.bin new file mode 100644 index 0000000000000000000000000000000000000000..52e3f4ecb46e28d36212d8607d08955d1923c6f3 --- /dev/null +++ b/params_shard_53.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1870c67d443bd984a962735300b96c01406fb9091bb28f59d69d0df1ed088820 +size 100663296 diff --git a/params_shard_54.bin b/params_shard_54.bin new file mode 100644 index 0000000000000000000000000000000000000000..11e82f7f1364fe6a664badc43dfb637f651455e9 --- /dev/null +++ b/params_shard_54.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1cea7e4f27a82051713262b5a34de587faaf7ca59f4161537fd5d0c06b9af83e +size 24403968 diff --git a/params_shard_55.bin b/params_shard_55.bin new file mode 100644 index 0000000000000000000000000000000000000000..363e6af160417e6907414651de2c76a2225988b9 --- /dev/null +++ b/params_shard_55.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98504039e1f5d19ece619a83b0a765ddfbf79b5e48c8eceb7ae72186c8986776 +size 50331648 diff --git a/params_shard_56.bin b/params_shard_56.bin new file mode 100644 index 0000000000000000000000000000000000000000..f28edf2fd4ecdb346f53abde51b2d7a54490a51a --- /dev/null +++ b/params_shard_56.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8b031cfe316ded5b49df1d439ce2f28758f78d9594f2cda0de1d58b71eef9ce +size 18874368 diff --git a/params_shard_57.bin b/params_shard_57.bin new file mode 100644 index 0000000000000000000000000000000000000000..c80eb572e3bacb8c8174798b41c5c50f9590871e --- /dev/null +++ b/params_shard_57.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b257cb1ab3a21fbe7dfa7a802e79b12fe6b1f7eeb7ab01994ebdbee2e022530 +size 25165824 diff --git a/params_shard_58.bin b/params_shard_58.bin new file mode 100644 index 0000000000000000000000000000000000000000..f72873219f3460b93562b29887e03387cc2a615f --- /dev/null +++ b/params_shard_58.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8245f273edbce645fd62d0545b58c56b4a27fb8bb107640d185b26a0e24612c2 +size 100663296 diff --git a/params_shard_59.bin b/params_shard_59.bin new file mode 100644 index 0000000000000000000000000000000000000000..8c2eb1f815bb0b3083f5aecf1749480beadf4e52 --- /dev/null +++ b/params_shard_59.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3605f007472deefc1baeecce4aa18a232d4a5afaaa4100c7ff878da7a08c498d +size 24403968 diff --git a/params_shard_6.bin b/params_shard_6.bin new file mode 100644 index 0000000000000000000000000000000000000000..6c4c52950295160e3882897a6486af3771f410b4 --- /dev/null +++ b/params_shard_6.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8a347c5e71de27774115b5f7f3e24d8d6deb7e98766cae46f384da5991d7357 +size 18874368 diff --git a/params_shard_60.bin b/params_shard_60.bin new file mode 100644 index 0000000000000000000000000000000000000000..326004f44f771fa99518a300ba801f7b5594f53c --- /dev/null +++ b/params_shard_60.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8a3dd5bf9416569ff529c044b199b768ba79cb02ce37047072842ac9d45d77c +size 50331648 diff --git a/params_shard_61.bin b/params_shard_61.bin new file mode 100644 index 0000000000000000000000000000000000000000..3e750b3a67998b3ef8a1d8fea4d1a27bea9ae676 --- /dev/null +++ b/params_shard_61.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9f19f7dbfabcff312d0f70bd9c359b3b9c5818f9da81537437fe74cefa4bf16 +size 18874368 diff --git a/params_shard_62.bin b/params_shard_62.bin new file mode 100644 index 0000000000000000000000000000000000000000..1eb1ee35181e4b7b8af6c4b56ff0b93a5dc971eb --- /dev/null +++ b/params_shard_62.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ee58329877eba87d02215ff37138ebe662a0c2c8ec6f93d7fdda2337ba51405 +size 25165824 diff --git a/params_shard_63.bin b/params_shard_63.bin new file mode 100644 index 0000000000000000000000000000000000000000..021050e509d0be8c708823d6e039fc809cbb4c0b --- /dev/null +++ b/params_shard_63.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a717f2b5698306f1606e63e930b66e027db4b5c5a0a5e6911fa06e53b686ba5b +size 100663296 diff --git a/params_shard_64.bin b/params_shard_64.bin new file mode 100644 index 0000000000000000000000000000000000000000..1235138055a1e8b42d672f77dc5c25be058a735e --- /dev/null +++ b/params_shard_64.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06558e0781d06e33f5701e3b41eeedb30f664850b92fb617d61af44ace814ccf +size 24403968 diff --git a/params_shard_65.bin b/params_shard_65.bin new file mode 100644 index 0000000000000000000000000000000000000000..cb703cb6b5ad1e941aa0f54ecd3db4d85c40485c --- /dev/null +++ b/params_shard_65.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0468713280fd1ecedcd5e64c2711ba2fecbdbbba0dcaf2dd83fa6f353b76668 +size 50331648 diff --git a/params_shard_66.bin b/params_shard_66.bin new file mode 100644 index 0000000000000000000000000000000000000000..ef8c1ed88e49ccdda65aca6d8901e9c7dadd8446 --- /dev/null +++ b/params_shard_66.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07c0f559cdcdd4125596001acfe303b46b6874cccd3c04ec8f2a22c2e2798660 +size 18874368 diff --git a/params_shard_67.bin b/params_shard_67.bin new file mode 100644 index 0000000000000000000000000000000000000000..16c6389e13ef40737800e0c45578ba5c88bbef3d --- /dev/null +++ b/params_shard_67.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35b693085fc0b6912f0cf0d7d82737c4e2f9cec35bae6b2603d4298d2d772d1b +size 25165824 diff --git a/params_shard_68.bin b/params_shard_68.bin new file mode 100644 index 0000000000000000000000000000000000000000..bc61b9f3848ef8d083cc7bf2d3b0f2078119874e --- /dev/null +++ b/params_shard_68.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ffff906045f5425a59e86cd493dc46d9bbb9a09a7735876b5da45513a27777b +size 100663296 diff --git a/params_shard_69.bin b/params_shard_69.bin new file mode 100644 index 0000000000000000000000000000000000000000..f64f9a3d43aa6763b2fbcf6c307959cc9bbd62cb --- /dev/null +++ b/params_shard_69.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:505f4715cfedf150ccb26508e5e7f10b7a3586a71afe9b5f18fece7ec525e04c +size 24391680 diff --git a/params_shard_7.bin b/params_shard_7.bin new file mode 100644 index 0000000000000000000000000000000000000000..d4a2f73181ed2cb80f1e31379cf625cf0dbf97eb --- /dev/null +++ b/params_shard_7.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8414c88387435309f44080af3356eec3b1580b0ee83ccdaf5eaf2691a7bf31b4 +size 25165824 diff --git a/params_shard_70.bin b/params_shard_70.bin new file mode 100644 index 0000000000000000000000000000000000000000..f67a0066a483744431a60f081a12091febcb13ca --- /dev/null +++ b/params_shard_70.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40882756d7f494dd8221a918470be90164aa8361425a009ad1e72f2d259e1c9c +size 50331648 diff --git a/params_shard_71.bin b/params_shard_71.bin new file mode 100644 index 0000000000000000000000000000000000000000..cf3b01337366f59b0edd05b92865fc64d7c52ba8 --- /dev/null +++ b/params_shard_71.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a42554cacce30cb3054bac8e7dcfd2393c07d82dc4fe952790bc54b6a37db345 +size 18874368 diff --git a/params_shard_72.bin b/params_shard_72.bin new file mode 100644 index 0000000000000000000000000000000000000000..9a83b257e4aecd0fdafe33efda41c0751609d490 --- /dev/null +++ b/params_shard_72.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70163d8a7e2f91702966e3fd01477ab564a55db2b7070ffca8364513dde80f07 +size 25165824 diff --git a/params_shard_73.bin b/params_shard_73.bin new file mode 100644 index 0000000000000000000000000000000000000000..f2da510f387119b752c974a3445f15bf4899e722 --- /dev/null +++ b/params_shard_73.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:088e238a73b3897e28cda75f1d004e41d3720ff892f669f19c91192e38572d16 +size 100663296 diff --git a/params_shard_74.bin b/params_shard_74.bin new file mode 100644 index 0000000000000000000000000000000000000000..6a4a25e0a33d505e59c525588f7ff2db489df253 --- /dev/null +++ b/params_shard_74.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96f8137e6aeafd4ac60c127180109c26df10178cc7b31613d1289c79bcf8e781 +size 24416256 diff --git a/params_shard_75.bin b/params_shard_75.bin new file mode 100644 index 0000000000000000000000000000000000000000..e92635a0b93edcbe9a213f01dd6729305153c589 --- /dev/null +++ b/params_shard_75.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89147aff40ca798f1928278186f776bdd1cb578a6d86f37fed8725e6fb08cd9e +size 50331648 diff --git a/params_shard_76.bin b/params_shard_76.bin new file mode 100644 index 0000000000000000000000000000000000000000..b12c69b77609ad78cbe31061d7b942a9ce550234 --- /dev/null +++ b/params_shard_76.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f31d543556fa3ef2f811e7041986528ca0d32d3fde373da1e40b2305373d21d +size 18874368 diff --git a/params_shard_77.bin b/params_shard_77.bin new file mode 100644 index 0000000000000000000000000000000000000000..37fdc6ed906263f8a309e678f0c1c5c98765cd56 --- /dev/null +++ b/params_shard_77.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d1d4b20a7ee71e7cd4ff3a7c2495aab74669260c027fb8aa7d2c7f870f7d788 +size 25165824 diff --git a/params_shard_78.bin b/params_shard_78.bin new file mode 100644 index 0000000000000000000000000000000000000000..0b108792315d70ac324b839496232f6aae1bff69 --- /dev/null +++ b/params_shard_78.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aac906c9f01121561d38f916132b47f1b9b518800ba00f34482489bc26abef10 +size 100663296 diff --git a/params_shard_79.bin b/params_shard_79.bin new file mode 100644 index 0000000000000000000000000000000000000000..2d650934d9184af9507bd14b3b48addca63d1be7 --- /dev/null +++ b/params_shard_79.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10844a623c5454dbde8b01d4af36c9fd1c0f64e4d6a036613053bdfd6a2d3956 +size 24403968 diff --git a/params_shard_8.bin b/params_shard_8.bin new file mode 100644 index 0000000000000000000000000000000000000000..0507a7f8f59f0dfa2e288352fd057110c19d23cf --- /dev/null +++ b/params_shard_8.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bdd22a33e469c226f864b7d84ca13d9a97aa1d18f5b6554a9abe9e7adbaa38e +size 100663296 diff --git a/params_shard_80.bin b/params_shard_80.bin new file mode 100644 index 0000000000000000000000000000000000000000..d6b0e4c8c34efd5c182177e80e7e59c1d2d7b27a --- /dev/null +++ b/params_shard_80.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81decf437a0193edde671e460004612dd0f900e5f2b10559f310d5a0f24432f4 +size 50331648 diff --git a/params_shard_81.bin b/params_shard_81.bin new file mode 100644 index 0000000000000000000000000000000000000000..5d5da27e91c13ca33b621b2a219acb32811dd74c --- /dev/null +++ b/params_shard_81.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c890550b2e57873b459a9c0d3502b69d15ff3f19cd72dfcec7e13c6dcc0a3c1 +size 18874368 diff --git a/params_shard_82.bin b/params_shard_82.bin new file mode 100644 index 0000000000000000000000000000000000000000..bd91bb36869e81132e25e78019b363d534299986 --- /dev/null +++ b/params_shard_82.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84b07421ab82169de1866970a5539612f33285309f9c451f4fe6f0e875ea8f8a +size 25165824 diff --git a/params_shard_83.bin b/params_shard_83.bin new file mode 100644 index 0000000000000000000000000000000000000000..6d850007f75204ce2adbd0461e8fcb24afc01f8a --- /dev/null +++ b/params_shard_83.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87be0bf0a43c53c60ba856d8fa408298cb26ad8fd19ed597ed42adb93c0d977a +size 100663296 diff --git a/params_shard_84.bin b/params_shard_84.bin new file mode 100644 index 0000000000000000000000000000000000000000..600cd86a2e01dc7edf8ff5a50c3762549bb36835 --- /dev/null +++ b/params_shard_84.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62ebdbeb02d6a42b94a96a97dc6270dd0897fde6d09fc1e8b1c2c0f78fa42e69 +size 24403968 diff --git a/params_shard_85.bin b/params_shard_85.bin new file mode 100644 index 0000000000000000000000000000000000000000..68c8644e14aee68679bff07e4facc160718c15cd --- /dev/null +++ b/params_shard_85.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:351a2f7c2d0df915739f55bb0520b224177ecdc76b0ac2035112fba1829daf4f +size 50331648 diff --git a/params_shard_86.bin b/params_shard_86.bin new file mode 100644 index 0000000000000000000000000000000000000000..b32a318e0ed9c30c5b25be514b15e48e54baa2b9 --- /dev/null +++ b/params_shard_86.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2804354544e50efe802ca0ae23899a97e1f1084468283460f6a76347b0f9a34a +size 18874368 diff --git a/params_shard_87.bin b/params_shard_87.bin new file mode 100644 index 0000000000000000000000000000000000000000..9ba444fba9a7e7f00ea433f49ee87ef0998bb52e --- /dev/null +++ b/params_shard_87.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1356cda4b4623b8b464ddf98f0aab01c5dd845c9b055441285838f48b303e4b +size 25165824 diff --git a/params_shard_88.bin b/params_shard_88.bin new file mode 100644 index 0000000000000000000000000000000000000000..403512027005bdc9e1aaf9e495b020c68f44dd23 --- /dev/null +++ b/params_shard_88.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8472c969b068e3347efa1845cae5129bcc1e5f9813e149908393e8afe925cce0 +size 100663296 diff --git a/params_shard_89.bin b/params_shard_89.bin new file mode 100644 index 0000000000000000000000000000000000000000..117ccf17bf5b13c3e42eea7b67f7c71dbf9e2d33 --- /dev/null +++ b/params_shard_89.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26cd922327b0cf4bfd211a79fcd28b6fae830bd8376e977bda46a547b416c482 +size 24403968 diff --git a/params_shard_9.bin b/params_shard_9.bin new file mode 100644 index 0000000000000000000000000000000000000000..9fe8f65311c44ae55a18bc129cdc2d9c115f0f41 --- /dev/null +++ b/params_shard_9.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02b47b7ed3ba3974950a2991827a1a91300ea68ea9c883501d4f314772799d24 +size 24403968 diff --git a/params_shard_90.bin b/params_shard_90.bin new file mode 100644 index 0000000000000000000000000000000000000000..5a6e1f5efe72b72be834b40453c402db8c40ba93 --- /dev/null +++ b/params_shard_90.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14df3ad9062b475d8f0ea7e8c7cd8c41fb9fe9aad203f16b83d12ec3f855aa74 +size 50331648 diff --git a/params_shard_91.bin b/params_shard_91.bin new file mode 100644 index 0000000000000000000000000000000000000000..e8aad65185b6bb117d4839b57148315fc5551f10 --- /dev/null +++ b/params_shard_91.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25a749029ba82b3921bee03ce58a351962a2e9e8ad621c744717d93c9bf2a198 +size 18874368 diff --git a/params_shard_92.bin b/params_shard_92.bin new file mode 100644 index 0000000000000000000000000000000000000000..b5d58110fa595e394dd64aa354d8a641c9c06f60 --- /dev/null +++ b/params_shard_92.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0f9e39969c650641d0b6ca87466b8fec74dc4511f0f5ec1cba3e05941c014a0 +size 25165824 diff --git a/params_shard_93.bin b/params_shard_93.bin new file mode 100644 index 0000000000000000000000000000000000000000..2713a2c41457d7472e5827e6ff344f0187f491e8 --- /dev/null +++ b/params_shard_93.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acdb9fc0baec8bda65df97aece9cb0992b9bc3c72e100b2275d2ef8051f4bf1d +size 100663296 diff --git a/params_shard_94.bin b/params_shard_94.bin new file mode 100644 index 0000000000000000000000000000000000000000..0a59ff79dedd2eb54b439d7523d47fd4eb8248e3 --- /dev/null +++ b/params_shard_94.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:989e8e2fd787d48553223b384beaf90539857bb28ef6e6d52ec8f1e2fc6fb839 +size 24391680 diff --git a/params_shard_95.bin b/params_shard_95.bin new file mode 100644 index 0000000000000000000000000000000000000000..dbeefb90eecfb2313d962107ebd9d74bb7411cd5 --- /dev/null +++ b/params_shard_95.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9273a6ebc9cc23a239610e2dd3989474174c4b1c924513e20a90d1466a1fc98f +size 50331648 diff --git a/params_shard_96.bin b/params_shard_96.bin new file mode 100644 index 0000000000000000000000000000000000000000..6a7a44ff08fe3abafdf6aabfd97a842450bf5730 --- /dev/null +++ b/params_shard_96.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d2e22ae3edd884f9642f384c438338f23692dd65dfc78b287c47a2ec76e86ae +size 18874368 diff --git a/params_shard_97.bin b/params_shard_97.bin new file mode 100644 index 0000000000000000000000000000000000000000..563694bc08dd3e89658c8e198aacf44c9c188298 --- /dev/null +++ b/params_shard_97.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68453288b2e37d806ec280367d42c5239d1857c7192d633c2ba0d72de3ddc376 +size 25165824 diff --git a/params_shard_98.bin b/params_shard_98.bin new file mode 100644 index 0000000000000000000000000000000000000000..7686bae12fbb54ceee0332d6bcdebcb3beb21ce4 --- /dev/null +++ b/params_shard_98.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9d68d0054743d517651b56dd1d3afe9675f5ba6956b9121f697a77dd37da88a +size 100663296 diff --git a/params_shard_99.bin b/params_shard_99.bin new file mode 100644 index 0000000000000000000000000000000000000000..5197a473b60071fbf08a1ceedaa1da9f3ac7df00 --- /dev/null +++ b/params_shard_99.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:979d1b60a1d0f8dcb8bc0cbd0ca28ce643cf87f31a6b1332d9ed11de1c4531a1 +size 24416256