diff --git a/added_tokens.json b/added_tokens.json new file mode 100644 index 0000000000000000000000000000000000000000..83d6990ad08c244dcef678082c5ffc9ffd85fb4a --- /dev/null +++ b/added_tokens.json @@ -0,0 +1,5 @@ +{ + "<|end_of_turn|>": 32000, + "<|endoftext|>": 50256, + "<|pad_0|>": 32001 +} diff --git a/mlc-chat-config.json b/mlc-chat-config.json new file mode 100644 index 0000000000000000000000000000000000000000..8ad427a1c8a9c20e6b90f699a6945a5bbbb618cf --- /dev/null +++ b/mlc-chat-config.json @@ -0,0 +1,23 @@ +{ + "model_lib": "CodeNinja-1.0-OpenChat-7B-q4f16_1", + "local_id": "CodeNinja-1.0-OpenChat-7B-q4f16_1", + "conv_template": "gpt2", + "temperature": 0.7, + "repetition_penalty": 1.0, + "top_p": 0.95, + "mean_gen_len": 128, + "max_gen_len": 16384, + "num_shards": 1, + "use_presharded_weights": false, + "shift_fill_factor": 0.3, + "tokenizer_files": [ + "added_tokens.json", + "tokenizer.json", + "tokenizer.model" + ], + "model_category": "mistral", + "model_name": "CodeNinja-1.0-OpenChat-7B", + "vocab_size": 32002, + "prefill_chunk_size": 4096, + "sliding_window": 4096 +} diff --git a/ndarray-cache.json b/ndarray-cache.json new file mode 100644 index 0000000000000000000000000000000000000000..20b5f3d4da3dfff8a79cb8d9dee23ce9d907a108 --- /dev/null +++ b/ndarray-cache.json @@ -0,0 +1,4587 @@ +{ + "metadata": { + "ParamSize": 327 + }, + "records": [ + { + "dataPath": "params_shard_0.bin", + "format": "raw-shard", + "nbytes": 131080192, + "records": [ + { + "name": "param_0", + "shape": [ + 32002, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 131080192, + "byteOffset": 0 + } + ], + "md5sum": "d4e42e9148f99bf819c8e340f3f8ebe9" + }, + { + "dataPath": "params_shard_1.bin", + "format": "raw-shard", + "nbytes": 33358336, + "records": [ + { + "name": "param_1", + "shape": [ + 32002, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192512, + "byteOffset": 0 + }, + { + "name": "param_2", + "shape": [ + 6144, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 8192512 + } + ], + "md5sum": "533ac3c1cebb9a24ce393720ae8eebfe" + }, + { + "dataPath": "params_shard_2.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "param_6", + "shape": [ + 28672, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "246ace4829a8c121502051b7acc98e70" + }, + { + "dataPath": "params_shard_3.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_8", + "shape": [ + 4096, + 3584 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "5184df8f4b44e3e0fdc79466b96e171b" + }, + { + "dataPath": "params_shard_4.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_12", + "shape": [ + 6144, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "fd283673dd6b6915fb217ff313c45357" + }, + { + "dataPath": "params_shard_5.bin", + "format": "raw-shard", + "nbytes": 16777216, + "records": [ + { + "name": "param_14", + "shape": [ + 4096, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 16777216, + "byteOffset": 0 + } + ], + "md5sum": "ff96de09265db71b0b6c67c779fa80af" + }, + { + "dataPath": "params_shard_6.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "param_16", + "shape": [ + 28672, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "d8c06913867a240a2c3c2a66e5dcd69d" + }, + { + "dataPath": "params_shard_7.bin", + "format": "raw-shard", + "nbytes": 33046528, + "records": [ + { + "name": "param_3", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 0 + }, + { + "name": "param_4", + "shape": [ + 4096, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 16777216, + "byteOffset": 1572864 + }, + { + "name": "param_5", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 18350080 + }, + { + "name": "param_7", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 19398656 + }, + { + "name": "param_9", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 26738688 + }, + { + "name": "param_10", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 30408704 + }, + { + "name": "param_11", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 30416896 + }, + { + "name": "param_13", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 30425088 + }, + { + "name": "param_15", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 31997952 + } + ], + "md5sum": "94d6d15aa7d2f24aa79c858322c5f1a0" + }, + { + "dataPath": "params_shard_8.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_18", + "shape": [ + 4096, + 3584 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "fd7e063f61febe5842c69787018ab04b" + }, + { + "dataPath": "params_shard_9.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_22", + "shape": [ + 6144, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "1fd3345da6eed45f03c98179dd3ce7dd" + }, + { + "dataPath": "params_shard_10.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "param_26", + "shape": [ + 28672, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "37dc9b6977d36ae543cfccf9c86432a3" + }, + { + "dataPath": "params_shard_11.bin", + "format": "raw-shard", + "nbytes": 30425088, + "records": [ + { + "name": "param_17", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_19", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_20", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_21", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_23", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 11026432 + }, + { + "name": "param_24", + "shape": [ + 4096, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 16777216, + "byteOffset": 12599296 + }, + { + "name": "param_25", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 29376512 + } + ], + "md5sum": "98fe8aff0eda423aeb02b0f4e5aee145" + }, + { + "dataPath": "params_shard_12.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_28", + "shape": [ + 4096, + 3584 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "21ba07b44780a57826d9c72015176d70" + }, + { + "dataPath": "params_shard_13.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_32", + "shape": [ + 6144, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "0325c7e3e4a83d591efb8e35b58b58de" + }, + { + "dataPath": "params_shard_14.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "param_36", + "shape": [ + 28672, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "950faa6dce8262ad25db4546a6e7b6c8" + }, + { + "dataPath": "params_shard_15.bin", + "format": "raw-shard", + "nbytes": 30425088, + "records": [ + { + "name": "param_27", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_29", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_30", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_31", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_33", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 11026432 + }, + { + "name": "param_34", + "shape": [ + 4096, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 16777216, + "byteOffset": 12599296 + }, + { + "name": "param_35", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 29376512 + } + ], + "md5sum": "0cafd8aba04a1e27a51ba119ce5bfa20" + }, + { + "dataPath": "params_shard_16.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_38", + "shape": [ + 4096, + 3584 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "b3ec33b46e2ac1402f033a2e1ee6c477" + }, + { + "dataPath": "params_shard_17.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_42", + "shape": [ + 6144, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "a8c453532bc085a23d7ba7d03d420e5c" + }, + { + "dataPath": "params_shard_18.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "param_46", + "shape": [ + 28672, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "8a4ecd64b7c85191384537953b69a44c" + }, + { + "dataPath": "params_shard_19.bin", + "format": "raw-shard", + "nbytes": 30425088, + "records": [ + { + "name": "param_37", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_39", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_40", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_41", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_43", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 11026432 + }, + { + "name": "param_44", + "shape": [ + 4096, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 16777216, + "byteOffset": 12599296 + }, + { + "name": "param_45", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 29376512 + } + ], + "md5sum": "e95e2e16d2fd2e99701fe34232f52ba0" + }, + { + "dataPath": "params_shard_20.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_48", + "shape": [ + 4096, + 3584 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "a127eb2ea65f6d7a82d48979e8fca070" + }, + { + "dataPath": "params_shard_21.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_52", + "shape": [ + 6144, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "d27ee0dd078dd199dab9d19b1743a0d6" + }, + { + "dataPath": "params_shard_22.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "param_56", + "shape": [ + 28672, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "d8c81357a55cd0e307c772f806f8a7d1" + }, + { + "dataPath": "params_shard_23.bin", + "format": "raw-shard", + "nbytes": 30425088, + "records": [ + { + "name": "param_47", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_49", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_50", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_51", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_53", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 11026432 + }, + { + "name": "param_54", + "shape": [ + 4096, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 16777216, + "byteOffset": 12599296 + }, + { + "name": "param_55", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 29376512 + } + ], + "md5sum": "3275d5bac495350f026e3150e13c82ac" + }, + { + "dataPath": "params_shard_24.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_58", + "shape": [ + 4096, + 3584 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "fd4873040126f39d6f241caad798e2f0" + }, + { + "dataPath": "params_shard_25.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_62", + "shape": [ + 6144, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "582230dd32de8a90e9d6a1fc689e8d55" + }, + { + "dataPath": "params_shard_26.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "param_66", + "shape": [ + 28672, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "f5dfbbe0438e9423e3d83310dd368eae" + }, + { + "dataPath": "params_shard_27.bin", + "format": "raw-shard", + "nbytes": 30425088, + "records": [ + { + "name": "param_57", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_59", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_60", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_61", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_63", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 11026432 + }, + { + "name": "param_64", + "shape": [ + 4096, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 16777216, + "byteOffset": 12599296 + }, + { + "name": "param_65", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 29376512 + } + ], + "md5sum": "fe060680e9efbe860c77c4b156cd54b8" + }, + { + "dataPath": "params_shard_28.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_68", + "shape": [ + 4096, + 3584 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "3b2fc0040fea0a140381ae32c4380113" + }, + { + "dataPath": "params_shard_29.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_72", + "shape": [ + 6144, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "559630bc33a5a79a57a21973b1157c14" + }, + { + "dataPath": "params_shard_30.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "param_76", + "shape": [ + 28672, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "ed8c944d5f2a8d07cff1427a3545a488" + }, + { + "dataPath": "params_shard_31.bin", + "format": "raw-shard", + "nbytes": 30425088, + "records": [ + { + "name": "param_67", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_69", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_70", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_71", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_73", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 11026432 + }, + { + "name": "param_74", + "shape": [ + 4096, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 16777216, + "byteOffset": 12599296 + }, + { + "name": "param_75", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 29376512 + } + ], + "md5sum": "6c382a9d037d6049eb82f27e6cf365de" + }, + { + "dataPath": "params_shard_32.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_78", + "shape": [ + 4096, + 3584 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "c4ae498cdc4bbaa24d058e22daf4089c" + }, + { + "dataPath": "params_shard_33.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_82", + "shape": [ + 6144, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "82e289d986dcae615b3b8a876c2b6cc9" + }, + { + "dataPath": "params_shard_34.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "param_86", + "shape": [ + 28672, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "a7bb013ec3c43134701887bd3a7757e7" + }, + { + "dataPath": "params_shard_35.bin", + "format": "raw-shard", + "nbytes": 30425088, + "records": [ + { + "name": "param_77", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_79", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_80", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_81", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_83", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 11026432 + }, + { + "name": "param_84", + "shape": [ + 4096, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 16777216, + "byteOffset": 12599296 + }, + { + "name": "param_85", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 29376512 + } + ], + "md5sum": "8228592ef4e526ccabea45a5a79f797f" + }, + { + "dataPath": "params_shard_36.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_88", + "shape": [ + 4096, + 3584 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "9757dc8c43a251131d199a32060832d1" + }, + { + "dataPath": "params_shard_37.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_92", + "shape": [ + 6144, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "f1ea6f667a151fd11b85849508279e06" + }, + { + "dataPath": "params_shard_38.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "param_96", + "shape": [ + 28672, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "13b4bb407d45f7124e4376cb3dd44bde" + }, + { + "dataPath": "params_shard_39.bin", + "format": "raw-shard", + "nbytes": 30425088, + "records": [ + { + "name": "param_87", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_89", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_90", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_91", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_93", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 11026432 + }, + { + "name": "param_94", + "shape": [ + 4096, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 16777216, + "byteOffset": 12599296 + }, + { + "name": "param_95", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 29376512 + } + ], + "md5sum": "9763a933c9b8dad31956fb984c35b84e" + }, + { + "dataPath": "params_shard_40.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_98", + "shape": [ + 4096, + 3584 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "1b49c6c91ac4aa90995c81bd306e4538" + }, + { + "dataPath": "params_shard_41.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_102", + "shape": [ + 6144, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "b0812ea87be2f207908bbc27b0db5ff2" + }, + { + "dataPath": "params_shard_42.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "param_106", + "shape": [ + 28672, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "509141b2af170b5be0945a5ee46320f7" + }, + { + "dataPath": "params_shard_43.bin", + "format": "raw-shard", + "nbytes": 30425088, + "records": [ + { + "name": "param_97", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_99", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_100", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_101", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_103", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 11026432 + }, + { + "name": "param_104", + "shape": [ + 4096, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 16777216, + "byteOffset": 12599296 + }, + { + "name": "param_105", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 29376512 + } + ], + "md5sum": "07423db5fa268ea31e26e173c64b51f1" + }, + { + "dataPath": "params_shard_44.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_108", + "shape": [ + 4096, + 3584 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "8cde19d752b16ee45463245f174c22c3" + }, + { + "dataPath": "params_shard_45.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_112", + "shape": [ + 6144, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "b08e73a6d42bea3162067b5ba630f251" + }, + { + "dataPath": "params_shard_46.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "param_116", + "shape": [ + 28672, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "ab2b1c188e6b4a3b647f62685bc60e72" + }, + { + "dataPath": "params_shard_47.bin", + "format": "raw-shard", + "nbytes": 30425088, + "records": [ + { + "name": "param_107", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_109", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_110", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_111", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_113", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 11026432 + }, + { + "name": "param_114", + "shape": [ + 4096, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 16777216, + "byteOffset": 12599296 + }, + { + "name": "param_115", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 29376512 + } + ], + "md5sum": "c033c05106abece7369d8c7af5e80985" + }, + { + "dataPath": "params_shard_48.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_118", + "shape": [ + 4096, + 3584 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "55838c71f1f9af8325ce8758ea6ce82a" + }, + { + "dataPath": "params_shard_49.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_122", + "shape": [ + 6144, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "0cfe470a4e9113b82d1ac7b34f2696f9" + }, + { + "dataPath": "params_shard_50.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "param_126", + "shape": [ + 28672, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "ea41389588ca18eb5fbdf2986947a26c" + }, + { + "dataPath": "params_shard_51.bin", + "format": "raw-shard", + "nbytes": 30425088, + "records": [ + { + "name": "param_117", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_119", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_120", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_121", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_123", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 11026432 + }, + { + "name": "param_124", + "shape": [ + 4096, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 16777216, + "byteOffset": 12599296 + }, + { + "name": "param_125", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 29376512 + } + ], + "md5sum": "7937ad058476b05c86230c73c95cee41" + }, + { + "dataPath": "params_shard_52.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_128", + "shape": [ + 4096, + 3584 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "8fd14b4c955a02a810596b183c719fb0" + }, + { + "dataPath": "params_shard_53.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_132", + "shape": [ + 6144, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "61b86ae751a1b4e64430a7b9d9a2c0a4" + }, + { + "dataPath": "params_shard_54.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "param_136", + "shape": [ + 28672, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "113f78e495bee6a14a60df8906078b24" + }, + { + "dataPath": "params_shard_55.bin", + "format": "raw-shard", + "nbytes": 30425088, + "records": [ + { + "name": "param_127", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_129", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_130", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_131", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_133", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 11026432 + }, + { + "name": "param_134", + "shape": [ + 4096, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 16777216, + "byteOffset": 12599296 + }, + { + "name": "param_135", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 29376512 + } + ], + "md5sum": "2b41ecdf503fee6843e266a968aa0a1d" + }, + { + "dataPath": "params_shard_56.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_138", + "shape": [ + 4096, + 3584 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "871c3e8077f15a92f24bfe83313aba46" + }, + { + "dataPath": "params_shard_57.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_142", + "shape": [ + 6144, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "119902fc71741f66ebec8ce95bd6e8b7" + }, + { + "dataPath": "params_shard_58.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "param_146", + "shape": [ + 28672, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "85a5088a58a470fad8579c5dd614d4b0" + }, + { + "dataPath": "params_shard_59.bin", + "format": "raw-shard", + "nbytes": 30425088, + "records": [ + { + "name": "param_137", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_139", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_140", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_141", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_143", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 11026432 + }, + { + "name": "param_144", + "shape": [ + 4096, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 16777216, + "byteOffset": 12599296 + }, + { + "name": "param_145", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 29376512 + } + ], + "md5sum": "2a7219b690ae487e96d7824e4667c9ab" + }, + { + "dataPath": "params_shard_60.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_148", + "shape": [ + 4096, + 3584 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "fb3c8309cf37c5d43b658119009eddd0" + }, + { + "dataPath": "params_shard_61.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_152", + "shape": [ + 6144, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "f327f7c8497988aacc572ddb6b931900" + }, + { + "dataPath": "params_shard_62.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "param_156", + "shape": [ + 28672, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "b287dd02e5c05f0ae74cb3082637dc76" + }, + { + "dataPath": "params_shard_63.bin", + "format": "raw-shard", + "nbytes": 30425088, + "records": [ + { + "name": "param_147", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_149", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_150", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_151", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_153", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 11026432 + }, + { + "name": "param_154", + "shape": [ + 4096, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 16777216, + "byteOffset": 12599296 + }, + { + "name": "param_155", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 29376512 + } + ], + "md5sum": "eff61fd2663f9001e21b432f9c4bebc2" + }, + { + "dataPath": "params_shard_64.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_158", + "shape": [ + 4096, + 3584 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "af3a6be6f390a156ae8143dbaff9e030" + }, + { + "dataPath": "params_shard_65.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_162", + "shape": [ + 6144, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "94df1a4f008e3fba0952563eeee390c7" + }, + { + "dataPath": "params_shard_66.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "param_166", + "shape": [ + 28672, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "bcbad1eea720e1038539ba3037b08d7b" + }, + { + "dataPath": "params_shard_67.bin", + "format": "raw-shard", + "nbytes": 30425088, + "records": [ + { + "name": "param_157", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_159", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_160", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_161", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_163", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 11026432 + }, + { + "name": "param_164", + "shape": [ + 4096, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 16777216, + "byteOffset": 12599296 + }, + { + "name": "param_165", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 29376512 + } + ], + "md5sum": "5ebbff1c9f4de5f68b770f4b73ad6729" + }, + { + "dataPath": "params_shard_68.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_168", + "shape": [ + 4096, + 3584 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "cb9b892a701c53c9de9e09ce01584de2" + }, + { + "dataPath": "params_shard_69.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_172", + "shape": [ + 6144, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "84dd787de4e19c0cd5466039e8110fed" + }, + { + "dataPath": "params_shard_70.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "param_176", + "shape": [ + 28672, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "a4ebd717fd5053492332d7520cae868f" + }, + { + "dataPath": "params_shard_71.bin", + "format": "raw-shard", + "nbytes": 30425088, + "records": [ + { + "name": "param_167", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_169", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_170", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_171", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_173", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 11026432 + }, + { + "name": "param_174", + "shape": [ + 4096, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 16777216, + "byteOffset": 12599296 + }, + { + "name": "param_175", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 29376512 + } + ], + "md5sum": "fa756e6a63e67910cc8d7ca07791b685" + }, + { + "dataPath": "params_shard_72.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_178", + "shape": [ + 4096, + 3584 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "f5e6fcb1df8bc47fe6af6d6cf6f50745" + }, + { + "dataPath": "params_shard_73.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_182", + "shape": [ + 6144, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "1b7892fadceb5b2942d2775683a72e1b" + }, + { + "dataPath": "params_shard_74.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "param_186", + "shape": [ + 28672, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "abc2c2a9141b701919dcbb203e66ad3b" + }, + { + "dataPath": "params_shard_75.bin", + "format": "raw-shard", + "nbytes": 30425088, + "records": [ + { + "name": "param_177", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_179", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_180", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_181", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_183", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 11026432 + }, + { + "name": "param_184", + "shape": [ + 4096, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 16777216, + "byteOffset": 12599296 + }, + { + "name": "param_185", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 29376512 + } + ], + "md5sum": "316d2e1efea90261433b916ee4ca1008" + }, + { + "dataPath": "params_shard_76.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_188", + "shape": [ + 4096, + 3584 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "373fc3f3d07fb6f696f602ab99622c30" + }, + { + "dataPath": "params_shard_77.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_192", + "shape": [ + 6144, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "6215dab4fd0f50d346780c5a326db1f6" + }, + { + "dataPath": "params_shard_78.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "param_196", + "shape": [ + 28672, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "3e60558301600b9cf781052880d16ad0" + }, + { + "dataPath": "params_shard_79.bin", + "format": "raw-shard", + "nbytes": 30425088, + "records": [ + { + "name": "param_187", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_189", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_190", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_191", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_193", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 11026432 + }, + { + "name": "param_194", + "shape": [ + 4096, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 16777216, + "byteOffset": 12599296 + }, + { + "name": "param_195", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 29376512 + } + ], + "md5sum": "0fee86ad2efea2dea77d485123ef72ca" + }, + { + "dataPath": "params_shard_80.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_198", + "shape": [ + 4096, + 3584 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "7936543ac2e48f9c16933501493dd75d" + }, + { + "dataPath": "params_shard_81.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_202", + "shape": [ + 6144, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "3d4fa13dab6843b60bd82c5a4eb36985" + }, + { + "dataPath": "params_shard_82.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "param_206", + "shape": [ + 28672, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "fea25c9eff0fabcd47abf24d0fcfdc2e" + }, + { + "dataPath": "params_shard_83.bin", + "format": "raw-shard", + "nbytes": 30425088, + "records": [ + { + "name": "param_197", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_199", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_200", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_201", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_203", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 11026432 + }, + { + "name": "param_204", + "shape": [ + 4096, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 16777216, + "byteOffset": 12599296 + }, + { + "name": "param_205", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 29376512 + } + ], + "md5sum": "e0d6fcf9f3d40b97304f63e9130f3a2d" + }, + { + "dataPath": "params_shard_84.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_208", + "shape": [ + 4096, + 3584 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "f3472b0b877a83c870d421067bf69844" + }, + { + "dataPath": "params_shard_85.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_212", + "shape": [ + 6144, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "bec37e459b2ca2e6989a19636d795b95" + }, + { + "dataPath": "params_shard_86.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "param_216", + "shape": [ + 28672, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "eeb5cedcffc763ad3f8ae3614fc33613" + }, + { + "dataPath": "params_shard_87.bin", + "format": "raw-shard", + "nbytes": 30425088, + "records": [ + { + "name": "param_207", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_209", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_210", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_211", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_213", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 11026432 + }, + { + "name": "param_214", + "shape": [ + 4096, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 16777216, + "byteOffset": 12599296 + }, + { + "name": "param_215", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 29376512 + } + ], + "md5sum": "a0ce067a9082950548b7d3db500f3dd5" + }, + { + "dataPath": "params_shard_88.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_218", + "shape": [ + 4096, + 3584 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "ca2b55755500c03f5ba2c58f400ff1d6" + }, + { + "dataPath": "params_shard_89.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_222", + "shape": [ + 6144, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "f89618a58169a45cc67d2cc4c6f37605" + }, + { + "dataPath": "params_shard_90.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "param_226", + "shape": [ + 28672, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "5696088558afbfaa454da266fe482ab8" + }, + { + "dataPath": "params_shard_91.bin", + "format": "raw-shard", + "nbytes": 30425088, + "records": [ + { + "name": "param_217", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_219", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_220", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_221", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_223", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 11026432 + }, + { + "name": "param_224", + "shape": [ + 4096, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 16777216, + "byteOffset": 12599296 + }, + { + "name": "param_225", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 29376512 + } + ], + "md5sum": "98b07647d32570dd4487e31b7fac6035" + }, + { + "dataPath": "params_shard_92.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_228", + "shape": [ + 4096, + 3584 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "3bd764db70e37346e37da72f2a2f8617" + }, + { + "dataPath": "params_shard_93.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_232", + "shape": [ + 6144, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "75561e72042c1cf8d732dd9515df40a0" + }, + { + "dataPath": "params_shard_94.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "param_236", + "shape": [ + 28672, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "192676549d05937f1e8f5d4d6a24d3c7" + }, + { + "dataPath": "params_shard_95.bin", + "format": "raw-shard", + "nbytes": 30425088, + "records": [ + { + "name": "param_227", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_229", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_230", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_231", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_233", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 11026432 + }, + { + "name": "param_234", + "shape": [ + 4096, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 16777216, + "byteOffset": 12599296 + }, + { + "name": "param_235", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 29376512 + } + ], + "md5sum": "0f75f03666fc7c114d609d9778bbbbc0" + }, + { + "dataPath": "params_shard_96.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_238", + "shape": [ + 4096, + 3584 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "c0fbd89174a062d186e4777211214ade" + }, + { + "dataPath": "params_shard_97.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_242", + "shape": [ + 6144, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "2be75fed42ebdeb3235ee0d25e9ff156" + }, + { + "dataPath": "params_shard_98.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "param_246", + "shape": [ + 28672, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "88c7c16db850e02d01a88dd5d3bf5ac7" + }, + { + "dataPath": "params_shard_99.bin", + "format": "raw-shard", + "nbytes": 30425088, + "records": [ + { + "name": "param_237", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_239", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_240", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_241", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_243", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 11026432 + }, + { + "name": "param_244", + "shape": [ + 4096, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 16777216, + "byteOffset": 12599296 + }, + { + "name": "param_245", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 29376512 + } + ], + "md5sum": "712c349be5659c199f9d5673712564df" + }, + { + "dataPath": "params_shard_100.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_248", + "shape": [ + 4096, + 3584 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "522616f11700960ec2a61c78d5ce40f1" + }, + { + "dataPath": "params_shard_101.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_252", + "shape": [ + 6144, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "945b213d3478f3cfc3c69a4152a9b0b5" + }, + { + "dataPath": "params_shard_102.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "param_256", + "shape": [ + 28672, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "f4159c8919d9ab8fbdfe5a23d4b64c87" + }, + { + "dataPath": "params_shard_103.bin", + "format": "raw-shard", + "nbytes": 30425088, + "records": [ + { + "name": "param_247", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_249", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_250", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_251", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_253", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 11026432 + }, + { + "name": "param_254", + "shape": [ + 4096, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 16777216, + "byteOffset": 12599296 + }, + { + "name": "param_255", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 29376512 + } + ], + "md5sum": "1eb178a7bac4103fb50123cf77b7fecf" + }, + { + "dataPath": "params_shard_104.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_258", + "shape": [ + 4096, + 3584 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "a735b6a1e2eb7200c659cd0d6181b051" + }, + { + "dataPath": "params_shard_105.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_262", + "shape": [ + 6144, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "2b00b0e3e29b218e6acf92c33f7dcd30" + }, + { + "dataPath": "params_shard_106.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "param_266", + "shape": [ + 28672, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "590c8fa46052121c8b65283c6aff03bb" + }, + { + "dataPath": "params_shard_107.bin", + "format": "raw-shard", + "nbytes": 30425088, + "records": [ + { + "name": "param_257", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_259", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_260", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_261", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_263", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 11026432 + }, + { + "name": "param_264", + "shape": [ + 4096, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 16777216, + "byteOffset": 12599296 + }, + { + "name": "param_265", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 29376512 + } + ], + "md5sum": "e057d4701e6b202b3b57883007d413a7" + }, + { + "dataPath": "params_shard_108.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_268", + "shape": [ + 4096, + 3584 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "398257e9bc04b782f708f874235a49ac" + }, + { + "dataPath": "params_shard_109.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_272", + "shape": [ + 6144, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "0818f440930b650e2600af74a04035bc" + }, + { + "dataPath": "params_shard_110.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "param_276", + "shape": [ + 28672, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "2be0e0a7c4ee0c31b2ebc41b7f379458" + }, + { + "dataPath": "params_shard_111.bin", + "format": "raw-shard", + "nbytes": 30425088, + "records": [ + { + "name": "param_267", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_269", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_270", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_271", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_273", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 11026432 + }, + { + "name": "param_274", + "shape": [ + 4096, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 16777216, + "byteOffset": 12599296 + }, + { + "name": "param_275", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 29376512 + } + ], + "md5sum": "24ef2ac84f33fdc7e09f9d78a0630647" + }, + { + "dataPath": "params_shard_112.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_278", + "shape": [ + 4096, + 3584 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "fe207259cea5e7cb07e01cc0d5618e2f" + }, + { + "dataPath": "params_shard_113.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_282", + "shape": [ + 6144, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "4060022d1db58ff20e87060a69a602db" + }, + { + "dataPath": "params_shard_114.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "param_286", + "shape": [ + 28672, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "f6d92aa8f572520e2ffcbf3d9949da20" + }, + { + "dataPath": "params_shard_115.bin", + "format": "raw-shard", + "nbytes": 30425088, + "records": [ + { + "name": "param_277", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_279", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_280", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_281", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_283", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 11026432 + }, + { + "name": "param_284", + "shape": [ + 4096, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 16777216, + "byteOffset": 12599296 + }, + { + "name": "param_285", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 29376512 + } + ], + "md5sum": "f6bebcc8bf2bea9efc3e63a71e0db457" + }, + { + "dataPath": "params_shard_116.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_288", + "shape": [ + 4096, + 3584 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "529ab500c8c2598f1cbd24248d7e8313" + }, + { + "dataPath": "params_shard_117.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_292", + "shape": [ + 6144, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "4618c31a56099803fd72fa582a3daf5b" + }, + { + "dataPath": "params_shard_118.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "param_296", + "shape": [ + 28672, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "25e0c1bdec54d8e79ba96c17a27fb63a" + }, + { + "dataPath": "params_shard_119.bin", + "format": "raw-shard", + "nbytes": 30425088, + "records": [ + { + "name": "param_287", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_289", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_290", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_291", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_293", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 11026432 + }, + { + "name": "param_294", + "shape": [ + 4096, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 16777216, + "byteOffset": 12599296 + }, + { + "name": "param_295", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 29376512 + } + ], + "md5sum": "a8e651ef39b26a15408d8f16be37bacf" + }, + { + "dataPath": "params_shard_120.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_298", + "shape": [ + 4096, + 3584 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "4667074b0995c834b9db045b8185e9ce" + }, + { + "dataPath": "params_shard_121.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_302", + "shape": [ + 6144, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "1854553dd3dc53e411f72fff08d519bd" + }, + { + "dataPath": "params_shard_122.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "param_306", + "shape": [ + 28672, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "027907c8700d2224bc6b7e5cfbf9dd37" + }, + { + "dataPath": "params_shard_123.bin", + "format": "raw-shard", + "nbytes": 30425088, + "records": [ + { + "name": "param_297", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_299", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_300", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_301", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_303", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 11026432 + }, + { + "name": "param_304", + "shape": [ + 4096, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 16777216, + "byteOffset": 12599296 + }, + { + "name": "param_305", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 29376512 + } + ], + "md5sum": "7d3c7fb7d291aabc0ffd2fd25fe14dbe" + }, + { + "dataPath": "params_shard_124.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_308", + "shape": [ + 4096, + 3584 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "9baa191de834936da1b048caa3657652" + }, + { + "dataPath": "params_shard_125.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_312", + "shape": [ + 6144, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "6d6ee027cd3e938bb4488955e6d3ee35" + }, + { + "dataPath": "params_shard_126.bin", + "format": "raw-shard", + "nbytes": 117440512, + "records": [ + { + "name": "param_316", + "shape": [ + 28672, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 117440512, + "byteOffset": 0 + } + ], + "md5sum": "13baa68fd4c1d91b388edc4bfeb1c239" + }, + { + "dataPath": "params_shard_127.bin", + "format": "raw-shard", + "nbytes": 30425088, + "records": [ + { + "name": "param_307", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_309", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_310", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_311", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_313", + "shape": [ + 6144, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 11026432 + }, + { + "name": "param_314", + "shape": [ + 4096, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 16777216, + "byteOffset": 12599296 + }, + { + "name": "param_315", + "shape": [ + 4096, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1048576, + "byteOffset": 29376512 + } + ], + "md5sum": "09e8710553132c113b7e373bfccab470" + }, + { + "dataPath": "params_shard_128.bin", + "format": "raw-shard", + "nbytes": 58720256, + "records": [ + { + "name": "param_318", + "shape": [ + 4096, + 3584 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 58720256, + "byteOffset": 0 + } + ], + "md5sum": "b16eadd3e28f541220f43efe4d8452f9" + }, + { + "dataPath": "params_shard_129.bin", + "format": "raw-shard", + "nbytes": 131080192, + "records": [ + { + "name": "param_323", + "shape": [ + 32002, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 131080192, + "byteOffset": 0 + } + ], + "md5sum": "28eec06f54c412092587fe4cd3085179" + }, + { + "dataPath": "params_shard_130.bin", + "format": "raw-shard", + "nbytes": 20275712, + "records": [ + { + "name": "param_317", + "shape": [ + 28672, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 7340032, + "byteOffset": 0 + }, + { + "name": "param_319", + "shape": [ + 4096, + 448 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3670016, + "byteOffset": 7340032 + }, + { + "name": "param_320", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11010048 + }, + { + "name": "param_321", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11018240 + }, + { + "name": "param_322", + "shape": [ + 4096 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192, + "byteOffset": 11026432 + }, + { + "name": "param_324", + "shape": [ + 32002, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 8192512, + "byteOffset": 11034624 + }, + { + "name": "param_325", + "shape": [ + 2048, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 524288, + "byteOffset": 19227136 + }, + { + "name": "param_326", + "shape": [ + 2048, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 524288, + "byteOffset": 19751424 + } + ], + "md5sum": "25f2ef97444060ccae6e37a716122957" + } + ] +} \ No newline at end of file diff --git a/params_shard_0.bin b/params_shard_0.bin new file mode 100644 index 0000000000000000000000000000000000000000..22d9ae5f35c59edfeafee1d3300a9871f9c1535c --- /dev/null +++ b/params_shard_0.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a98380c7bd728d9b861593a777c31c06a29b53d854b320c868de64d82acfbbc2 +size 131080192 diff --git a/params_shard_1.bin b/params_shard_1.bin new file mode 100644 index 0000000000000000000000000000000000000000..9e4d9b52832ffb938f3183d049221879136122bf --- /dev/null +++ b/params_shard_1.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94752cb990e6429c77079cd310acf9b49dd09781543d2e1babfdac745187b1b9 +size 33358336 diff --git a/params_shard_10.bin b/params_shard_10.bin new file mode 100644 index 0000000000000000000000000000000000000000..da33dd1be31b14cec9da290d604302d04d31422a --- /dev/null +++ b/params_shard_10.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcc0e26bdccf315a54aee4393a8978db1753ee2519cd61335106a39df2e84ff6 +size 117440512 diff --git a/params_shard_11.bin b/params_shard_11.bin new file mode 100644 index 0000000000000000000000000000000000000000..eb103dd00a6311f85cbb80e94d824278517185dd --- /dev/null +++ b/params_shard_11.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72c701f65d5389430bc471365c9cefd6e53fe93ae29517c46ed348c1d71f572e +size 30425088 diff --git a/params_shard_12.bin b/params_shard_12.bin new file mode 100644 index 0000000000000000000000000000000000000000..a7189fb85a9bee011b582ee03c7c60151c440f70 --- /dev/null +++ b/params_shard_12.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14488d1a788579c3be9278d33fe44d4f104c2bd0e9c4eab9fcbb55df5643a175 +size 58720256 diff --git a/params_shard_13.bin b/params_shard_13.bin new file mode 100644 index 0000000000000000000000000000000000000000..16027d47634f20198f8a47653815ee6097fed2be --- /dev/null +++ b/params_shard_13.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5461d470e62ea97a3d810b74b6e74a5c58c74f218102a4c60fa2ef18ea28c5c +size 25165824 diff --git a/params_shard_14.bin b/params_shard_14.bin new file mode 100644 index 0000000000000000000000000000000000000000..aa7134609ebe946a088fcc939833fd22139ba3a1 --- /dev/null +++ b/params_shard_14.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87ce828ab43b3623b44a44a4478fd44336356e13c3c69302a72ca583b9995116 +size 117440512 diff --git a/params_shard_15.bin b/params_shard_15.bin new file mode 100644 index 0000000000000000000000000000000000000000..3114205ad6f681fc50d2968d6d6a06e66d4cee69 --- /dev/null +++ b/params_shard_15.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f2b3eed53bbd907e52fda46d545276fc232b3f47929b4629542f1321361ec0c +size 30425088 diff --git a/params_shard_16.bin b/params_shard_16.bin new file mode 100644 index 0000000000000000000000000000000000000000..dcb217c17013be867db93a197c2cd9467d535c7e --- /dev/null +++ b/params_shard_16.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a26c88670a598e03c970054cd577ead25c68413dafa47524b2c439aac0443964 +size 58720256 diff --git a/params_shard_17.bin b/params_shard_17.bin new file mode 100644 index 0000000000000000000000000000000000000000..934559679e9f11c339e9d228f08a7a17a1dd728d --- /dev/null +++ b/params_shard_17.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d27ea23e9769a4118401f8fb5f8e4563bf5db4a55747e153967c8349428eece4 +size 25165824 diff --git a/params_shard_18.bin b/params_shard_18.bin new file mode 100644 index 0000000000000000000000000000000000000000..37f9a9097448f3f8c7c71e78bef81aed68b563f4 --- /dev/null +++ b/params_shard_18.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f8ffb9540d1acf240683620a7127c05f354c9b93b7cde5bd02a5b0457605d33 +size 117440512 diff --git a/params_shard_19.bin b/params_shard_19.bin new file mode 100644 index 0000000000000000000000000000000000000000..144920272a8537f5a7314ed3e462efb1284ae945 --- /dev/null +++ b/params_shard_19.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35317b0d54493381d03917dd04b0399be8384c97ea72e3ba1fd8f44ed528d214 +size 30425088 diff --git a/params_shard_2.bin b/params_shard_2.bin new file mode 100644 index 0000000000000000000000000000000000000000..0cffe8abeb651828c5dbadc7098bac4f9ae7d2b6 --- /dev/null +++ b/params_shard_2.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:083e6a905129589088122aefe32c07032eacf42c97bb2d00a699e15c249265d1 +size 117440512 diff --git a/params_shard_20.bin b/params_shard_20.bin new file mode 100644 index 0000000000000000000000000000000000000000..f6815d4929cda5c33dbd748f330b2b1ce422d1e5 --- /dev/null +++ b/params_shard_20.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d695bdae4f85127c7d2cdc397593cfd427a22f3132f0e67c7e289c5751c8e77c +size 58720256 diff --git a/params_shard_21.bin b/params_shard_21.bin new file mode 100644 index 0000000000000000000000000000000000000000..daaaf2467a10f891f9dbc5eb4d156380956249d4 --- /dev/null +++ b/params_shard_21.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c62d55d3c974243c2fa78c76f8eff8d0e15f46d69c30431767b0be3c45366f10 +size 25165824 diff --git a/params_shard_22.bin b/params_shard_22.bin new file mode 100644 index 0000000000000000000000000000000000000000..773419228473dee0f56942d39fb2d2e094aa00e7 --- /dev/null +++ b/params_shard_22.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbae5d9d167767c71408b4906ad95cd443da7d582478397a8416bd19a4cb2164 +size 117440512 diff --git a/params_shard_23.bin b/params_shard_23.bin new file mode 100644 index 0000000000000000000000000000000000000000..991b2e24e16f881ebc19cacc7db642e550ee38be --- /dev/null +++ b/params_shard_23.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a7cee3fc8dbcdae9c2347358a653874eeada6980fdee57f146a8566542edc8d +size 30425088 diff --git a/params_shard_24.bin b/params_shard_24.bin new file mode 100644 index 0000000000000000000000000000000000000000..a1b802cfead1ea251015f834330b7ddfb3c64a8e --- /dev/null +++ b/params_shard_24.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe376644cc1f0beb40ad9d19279ffbcccdbbb476fa732ead2438a6b16458d231 +size 58720256 diff --git a/params_shard_25.bin b/params_shard_25.bin new file mode 100644 index 0000000000000000000000000000000000000000..ffc5376a24e484749c8bda375bfa5e89f6937fbf --- /dev/null +++ b/params_shard_25.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ffd0a29cd1b0253bf0b9853e759bba08fff158bb9ffd9301c42600368263b99 +size 25165824 diff --git a/params_shard_26.bin b/params_shard_26.bin new file mode 100644 index 0000000000000000000000000000000000000000..5f460e48f98c08ba219834e581e5c831af09d5a1 --- /dev/null +++ b/params_shard_26.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc8b5fdc4b045f425e62546ec41eebfc373b5b731ee99a9299769ed835d49bbe +size 117440512 diff --git a/params_shard_27.bin b/params_shard_27.bin new file mode 100644 index 0000000000000000000000000000000000000000..992fd43f30dcda0843caddf803966290239aaed2 --- /dev/null +++ b/params_shard_27.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfc9f8e883d0cf934c7df9e05d1ace89ac11b743e7afcdd26a738e9fb10c79d6 +size 30425088 diff --git a/params_shard_28.bin b/params_shard_28.bin new file mode 100644 index 0000000000000000000000000000000000000000..5bd997a052c488daa74aed00cb790429369aa4e7 --- /dev/null +++ b/params_shard_28.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5399b97dd54d1a0887330b9a967e3ff1f8523abb0a26f7f50914570134d0e53 +size 58720256 diff --git a/params_shard_29.bin b/params_shard_29.bin new file mode 100644 index 0000000000000000000000000000000000000000..0b7f551252592f31f3dec8d634239857fc559677 --- /dev/null +++ b/params_shard_29.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9defb838f1e2d4f8f37d1fe564d4a01fd3bfe521b62f1ed1b8c7167594456aa +size 25165824 diff --git a/params_shard_3.bin b/params_shard_3.bin new file mode 100644 index 0000000000000000000000000000000000000000..b6fa434c65d757580b8300572ff94d9e248b0690 --- /dev/null +++ b/params_shard_3.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f597c7d84e087668f2ce3a6eed109cf1624fa4d97796fad55224eef12666bad +size 58720256 diff --git a/params_shard_30.bin b/params_shard_30.bin new file mode 100644 index 0000000000000000000000000000000000000000..cf7d1d8277ca174c2030be1cfbbacba79a142b45 --- /dev/null +++ b/params_shard_30.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10453d81de58b40057ca21d02d7d35fe27cfbebce35c5605693421c37c388390 +size 117440512 diff --git a/params_shard_31.bin b/params_shard_31.bin new file mode 100644 index 0000000000000000000000000000000000000000..f30f6be8444c04e32cd881b7f1fadb0b512f94e2 --- /dev/null +++ b/params_shard_31.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4859ce42e04b42d3616f0fb2755bb6646adb98a45123174e1d77efc02e29c2a +size 30425088 diff --git a/params_shard_32.bin b/params_shard_32.bin new file mode 100644 index 0000000000000000000000000000000000000000..ff7121d31d5b368e827b9150ea5dbf4b9692a682 --- /dev/null +++ b/params_shard_32.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b36bcb87e57c27c4941bad1116621b1140cda143649f97403f2b41510e06b5ed +size 58720256 diff --git a/params_shard_33.bin b/params_shard_33.bin new file mode 100644 index 0000000000000000000000000000000000000000..a9e0f1caa8d6f690a33bfd93a346799c9f7a92b3 --- /dev/null +++ b/params_shard_33.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ae00a1c91d723dd6c3626f18bc6aa17ec74be4b179f86fcebf1d9a2c6f96084 +size 25165824 diff --git a/params_shard_34.bin b/params_shard_34.bin new file mode 100644 index 0000000000000000000000000000000000000000..c40f053018dfaed3a0818b131744f79bebb7219b --- /dev/null +++ b/params_shard_34.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0660bf13363be8b89dc1bdfd8626f9f0be69532c83d4d8f64c3af84aa6bab8a7 +size 117440512 diff --git a/params_shard_35.bin b/params_shard_35.bin new file mode 100644 index 0000000000000000000000000000000000000000..e50e91b8b2b6f493659b659ac2461be17d1c8ca3 --- /dev/null +++ b/params_shard_35.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e5e99c33cd9ffe430fedf6f4fc83d0aee7d1099eb62d6984d91d34db8d5bb4f +size 30425088 diff --git a/params_shard_36.bin b/params_shard_36.bin new file mode 100644 index 0000000000000000000000000000000000000000..cb8cd261fd71323e29b13938318576e1d72a6a43 --- /dev/null +++ b/params_shard_36.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b13428a4d39bbf63949e34c13d446c46326b19f591a08841fb45b060c2004da2 +size 58720256 diff --git a/params_shard_37.bin b/params_shard_37.bin new file mode 100644 index 0000000000000000000000000000000000000000..dad2726e5a9ee8139902fbbedf198010020ee745 --- /dev/null +++ b/params_shard_37.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2e999078ce8661367a53a6da21c1c59fd22b7d575dd0fe2c5c41d613d938190 +size 25165824 diff --git a/params_shard_38.bin b/params_shard_38.bin new file mode 100644 index 0000000000000000000000000000000000000000..d13f418f6554654a06a43a1f91a9bfa246b65138 --- /dev/null +++ b/params_shard_38.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b98755e63df8e2325e9a12d7db07e3ad6b653e762bfb195e22cfc1db90bbe912 +size 117440512 diff --git a/params_shard_39.bin b/params_shard_39.bin new file mode 100644 index 0000000000000000000000000000000000000000..b008292e1933a4dac57dac2037f494bafa0de940 --- /dev/null +++ b/params_shard_39.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48242f3b0ed7aa737295698dbbcbca26ddd5654cce71a7b2bd176b85c3fa8720 +size 30425088 diff --git a/params_shard_4.bin b/params_shard_4.bin new file mode 100644 index 0000000000000000000000000000000000000000..02c312663fb935036276ee6cf54c7a00a52a4db4 --- /dev/null +++ b/params_shard_4.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:009459d724b32af6c7812f267ba5582ca42dbc01936dfaaab1f4783ec95fb9e2 +size 25165824 diff --git a/params_shard_40.bin b/params_shard_40.bin new file mode 100644 index 0000000000000000000000000000000000000000..285312c4043851b392f9ff3ccc7f387f1b470784 --- /dev/null +++ b/params_shard_40.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a9b3949b9fb84d1d5c2dd1cdec4ff15fe1a6cd70da2c88b3151f8fd87ff9447 +size 58720256 diff --git a/params_shard_41.bin b/params_shard_41.bin new file mode 100644 index 0000000000000000000000000000000000000000..9ad4b95ec1eda35b9176bd9a60ec6946b4cb1b55 --- /dev/null +++ b/params_shard_41.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e05c7e07aaf2b94138fd3a23f18eccd352c8cb58a88082819a9c9d9366b429c5 +size 25165824 diff --git a/params_shard_42.bin b/params_shard_42.bin new file mode 100644 index 0000000000000000000000000000000000000000..9fea1ac8e8a38080cdf7eb32324190ffe1e789a8 --- /dev/null +++ b/params_shard_42.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93c5c965adb30f68bc03faa47724a61069de759efbda2862fa86b4fdccf24552 +size 117440512 diff --git a/params_shard_43.bin b/params_shard_43.bin new file mode 100644 index 0000000000000000000000000000000000000000..8f83227a540364418f34735db4a993c8cf5ede3d --- /dev/null +++ b/params_shard_43.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67ec84a02094b2e76a121781077490fdbf1104c95efcc8c55f26b19a68f5b230 +size 30425088 diff --git a/params_shard_44.bin b/params_shard_44.bin new file mode 100644 index 0000000000000000000000000000000000000000..baec39da7de1dfd761952ec0374affe1d9c26aea --- /dev/null +++ b/params_shard_44.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d95471e1688f3765bcf2e53d354c1406b83c4fd035157a18c48d89af7f027358 +size 58720256 diff --git a/params_shard_45.bin b/params_shard_45.bin new file mode 100644 index 0000000000000000000000000000000000000000..e3395c4864156f6616aceef8efd1a31cabcce71b --- /dev/null +++ b/params_shard_45.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb0214ee1f69a987648926025dff36505b5b0d12c372e6028e5d70309750212e +size 25165824 diff --git a/params_shard_46.bin b/params_shard_46.bin new file mode 100644 index 0000000000000000000000000000000000000000..056269435d7238acfc6a12e25677a90a812fc474 --- /dev/null +++ b/params_shard_46.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d510e3f8ffdf53eb58ee365af74ad5041d81c4f3e090f04d89ba1bb4cc95a12d +size 117440512 diff --git a/params_shard_47.bin b/params_shard_47.bin new file mode 100644 index 0000000000000000000000000000000000000000..b4d18faf50e0179745b4ed89f1c841fdaa07d20c --- /dev/null +++ b/params_shard_47.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80d7ebc83f19ac3defb47f292fedaf45dd743d2c3cbd610c96425b4e664dfad7 +size 30425088 diff --git a/params_shard_48.bin b/params_shard_48.bin new file mode 100644 index 0000000000000000000000000000000000000000..ca99e2ebc2bc43e2a26235ef8e4268a8dac14afc --- /dev/null +++ b/params_shard_48.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c978df1548f25d12da2cadb2bdc80083b0b94ca423184e435ef27b873181363e +size 58720256 diff --git a/params_shard_49.bin b/params_shard_49.bin new file mode 100644 index 0000000000000000000000000000000000000000..06ecdd108a0f4ab34a5875392d56759d1cc795f4 --- /dev/null +++ b/params_shard_49.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ac34ccd7f2c4c7055f4eebd3d9f97f9cc1d69de076f3f0823276a3f40ec8605 +size 25165824 diff --git a/params_shard_5.bin b/params_shard_5.bin new file mode 100644 index 0000000000000000000000000000000000000000..8e3f4d4546aaeaf45d313f7ae4c92ecbf43c48d3 --- /dev/null +++ b/params_shard_5.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6f54fd0b81b28ae75f784bc4855b3c21d3069de3a37a5e31bc24234a4b19628 +size 16777216 diff --git a/params_shard_50.bin b/params_shard_50.bin new file mode 100644 index 0000000000000000000000000000000000000000..8bbd12e6c7eebe1c1ab1b2d48c6f11fbbdc75ac6 --- /dev/null +++ b/params_shard_50.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e8f61b176debdd5b538363e67035f70712a85949dd86e655302b06b7de20a23 +size 117440512 diff --git a/params_shard_6.bin b/params_shard_6.bin new file mode 100644 index 0000000000000000000000000000000000000000..141a9f1f3e9c9fce2a435116215774a494e44be1 --- /dev/null +++ b/params_shard_6.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bb526c23fa6feb953e403a8379a3571a4733bf2cdeb3837ae623bb8bc990d27 +size 117440512 diff --git a/params_shard_7.bin b/params_shard_7.bin new file mode 100644 index 0000000000000000000000000000000000000000..4a198cfaa8e0d208afcea75d672b826ff60bb796 --- /dev/null +++ b/params_shard_7.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8589fb2db7c3495f3c9c94131038778a21d3af652823a2eee6898b6411548851 +size 33046528 diff --git a/params_shard_8.bin b/params_shard_8.bin new file mode 100644 index 0000000000000000000000000000000000000000..e9051ed04c036ad44ee1ebaf35578a57d2b50a3c --- /dev/null +++ b/params_shard_8.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85ee143a2670da31e0cf9d277d423e96a55367d1ee1f2096e42ae1aeef14f38c +size 58720256 diff --git a/params_shard_9.bin b/params_shard_9.bin new file mode 100644 index 0000000000000000000000000000000000000000..23554804ab704f7d04b2ef6847cf9fd69e405e97 --- /dev/null +++ b/params_shard_9.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:176a460777de50a78776b2d29aba37b4ca06dabdc4c7a33758bab76a32da501f +size 25165824