diff --git a/added_tokens.json b/added_tokens.json new file mode 100644 index 0000000000000000000000000000000000000000..9c16aa4be022f03ad001b006fba14dfb73a1929c --- /dev/null +++ b/added_tokens.json @@ -0,0 +1,3 @@ +{ + "": 32000 +} diff --git a/ndarray-cache.json b/ndarray-cache.json new file mode 100644 index 0000000000000000000000000000000000000000..22309a34402fd0d5e837c0dc4d2821de4965902b --- /dev/null +++ b/ndarray-cache.json @@ -0,0 +1,7275 @@ +{ + "metadata": { + "ParamSize": 565 + }, + "records": [ + { + "dataPath": "params_shard_0.bin", + "format": "raw-shard", + "nbytes": 327680000, + "records": [ + { + "name": "param_0", + "shape": [ + 32000, + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 327680000, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_1.bin", + "format": "raw-shard", + "nbytes": 39321600, + "records": [ + { + "name": "param_1", + "shape": [ + 15360, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 39321600, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_2.bin", + "format": "raw-shard", + "nbytes": 70778880, + "records": [ + { + "name": "param_7", + "shape": [ + 27648, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 70778880, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_3.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_10", + "shape": [ + 5120, + 1728 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_4.bin", + "format": "raw-shard", + "nbytes": 39321600, + "records": [ + { + "name": "param_15", + "shape": [ + 15360, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 39321600, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_5.bin", + "format": "raw-shard", + "nbytes": 25497600, + "records": [ + { + "name": "param_2", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 0 + }, + { + "name": "param_3", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 1228800 + }, + { + "name": "param_4", + "shape": [ + 5120, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 2457600 + }, + { + "name": "param_5", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 15564800 + }, + { + "name": "param_6", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 15974400 + }, + { + "name": "param_8", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 16384000 + }, + { + "name": "param_9", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 18595840 + }, + { + "name": "param_11", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 20807680 + }, + { + "name": "param_12", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 21913600 + }, + { + "name": "param_13", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 23019520 + }, + { + "name": "param_14", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 23029760 + }, + { + "name": "param_16", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 23040000 + }, + { + "name": "param_17", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 24268800 + } + ] + }, + { + "dataPath": "params_shard_6.bin", + "format": "raw-shard", + "nbytes": 70778880, + "records": [ + { + "name": "param_21", + "shape": [ + 27648, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 70778880, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_7.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_24", + "shape": [ + 5120, + 1728 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_8.bin", + "format": "raw-shard", + "nbytes": 39321600, + "records": [ + { + "name": "param_29", + "shape": [ + 15360, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 39321600, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_9.bin", + "format": "raw-shard", + "nbytes": 23040000, + "records": [ + { + "name": "param_18", + "shape": [ + 5120, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_19", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13107200 + }, + { + "name": "param_20", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13516800 + }, + { + "name": "param_22", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 13926400 + }, + { + "name": "param_23", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 16138240 + }, + { + "name": "param_25", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 18350080 + }, + { + "name": "param_26", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 19456000 + }, + { + "name": "param_27", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20561920 + }, + { + "name": "param_28", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20572160 + }, + { + "name": "param_30", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 20582400 + }, + { + "name": "param_31", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 21811200 + } + ] + }, + { + "dataPath": "params_shard_10.bin", + "format": "raw-shard", + "nbytes": 70778880, + "records": [ + { + "name": "param_35", + "shape": [ + 27648, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 70778880, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_11.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_38", + "shape": [ + 5120, + 1728 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_12.bin", + "format": "raw-shard", + "nbytes": 39321600, + "records": [ + { + "name": "param_43", + "shape": [ + 15360, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 39321600, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_13.bin", + "format": "raw-shard", + "nbytes": 23040000, + "records": [ + { + "name": "param_32", + "shape": [ + 5120, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_33", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13107200 + }, + { + "name": "param_34", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13516800 + }, + { + "name": "param_36", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 13926400 + }, + { + "name": "param_37", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 16138240 + }, + { + "name": "param_39", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 18350080 + }, + { + "name": "param_40", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 19456000 + }, + { + "name": "param_41", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20561920 + }, + { + "name": "param_42", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20572160 + }, + { + "name": "param_44", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 20582400 + }, + { + "name": "param_45", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 21811200 + } + ] + }, + { + "dataPath": "params_shard_14.bin", + "format": "raw-shard", + "nbytes": 70778880, + "records": [ + { + "name": "param_49", + "shape": [ + 27648, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 70778880, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_15.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_52", + "shape": [ + 5120, + 1728 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_16.bin", + "format": "raw-shard", + "nbytes": 39321600, + "records": [ + { + "name": "param_57", + "shape": [ + 15360, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 39321600, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_17.bin", + "format": "raw-shard", + "nbytes": 23040000, + "records": [ + { + "name": "param_46", + "shape": [ + 5120, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_47", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13107200 + }, + { + "name": "param_48", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13516800 + }, + { + "name": "param_50", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 13926400 + }, + { + "name": "param_51", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 16138240 + }, + { + "name": "param_53", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 18350080 + }, + { + "name": "param_54", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 19456000 + }, + { + "name": "param_55", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20561920 + }, + { + "name": "param_56", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20572160 + }, + { + "name": "param_58", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 20582400 + }, + { + "name": "param_59", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 21811200 + } + ] + }, + { + "dataPath": "params_shard_18.bin", + "format": "raw-shard", + "nbytes": 70778880, + "records": [ + { + "name": "param_63", + "shape": [ + 27648, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 70778880, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_19.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_66", + "shape": [ + 5120, + 1728 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_20.bin", + "format": "raw-shard", + "nbytes": 39321600, + "records": [ + { + "name": "param_71", + "shape": [ + 15360, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 39321600, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_21.bin", + "format": "raw-shard", + "nbytes": 23040000, + "records": [ + { + "name": "param_60", + "shape": [ + 5120, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_61", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13107200 + }, + { + "name": "param_62", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13516800 + }, + { + "name": "param_64", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 13926400 + }, + { + "name": "param_65", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 16138240 + }, + { + "name": "param_67", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 18350080 + }, + { + "name": "param_68", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 19456000 + }, + { + "name": "param_69", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20561920 + }, + { + "name": "param_70", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20572160 + }, + { + "name": "param_72", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 20582400 + }, + { + "name": "param_73", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 21811200 + } + ] + }, + { + "dataPath": "params_shard_22.bin", + "format": "raw-shard", + "nbytes": 70778880, + "records": [ + { + "name": "param_77", + "shape": [ + 27648, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 70778880, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_23.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_80", + "shape": [ + 5120, + 1728 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_24.bin", + "format": "raw-shard", + "nbytes": 39321600, + "records": [ + { + "name": "param_85", + "shape": [ + 15360, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 39321600, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_25.bin", + "format": "raw-shard", + "nbytes": 23040000, + "records": [ + { + "name": "param_74", + "shape": [ + 5120, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_75", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13107200 + }, + { + "name": "param_76", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13516800 + }, + { + "name": "param_78", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 13926400 + }, + { + "name": "param_79", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 16138240 + }, + { + "name": "param_81", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 18350080 + }, + { + "name": "param_82", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 19456000 + }, + { + "name": "param_83", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20561920 + }, + { + "name": "param_84", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20572160 + }, + { + "name": "param_86", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 20582400 + }, + { + "name": "param_87", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 21811200 + } + ] + }, + { + "dataPath": "params_shard_26.bin", + "format": "raw-shard", + "nbytes": 70778880, + "records": [ + { + "name": "param_91", + "shape": [ + 27648, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 70778880, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_27.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_94", + "shape": [ + 5120, + 1728 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_28.bin", + "format": "raw-shard", + "nbytes": 39321600, + "records": [ + { + "name": "param_99", + "shape": [ + 15360, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 39321600, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_29.bin", + "format": "raw-shard", + "nbytes": 23040000, + "records": [ + { + "name": "param_88", + "shape": [ + 5120, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_89", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13107200 + }, + { + "name": "param_90", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13516800 + }, + { + "name": "param_92", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 13926400 + }, + { + "name": "param_93", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 16138240 + }, + { + "name": "param_95", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 18350080 + }, + { + "name": "param_96", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 19456000 + }, + { + "name": "param_97", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20561920 + }, + { + "name": "param_98", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20572160 + }, + { + "name": "param_100", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 20582400 + }, + { + "name": "param_101", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 21811200 + } + ] + }, + { + "dataPath": "params_shard_30.bin", + "format": "raw-shard", + "nbytes": 70778880, + "records": [ + { + "name": "param_105", + "shape": [ + 27648, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 70778880, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_31.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_108", + "shape": [ + 5120, + 1728 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_32.bin", + "format": "raw-shard", + "nbytes": 39321600, + "records": [ + { + "name": "param_113", + "shape": [ + 15360, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 39321600, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_33.bin", + "format": "raw-shard", + "nbytes": 23040000, + "records": [ + { + "name": "param_102", + "shape": [ + 5120, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_103", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13107200 + }, + { + "name": "param_104", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13516800 + }, + { + "name": "param_106", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 13926400 + }, + { + "name": "param_107", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 16138240 + }, + { + "name": "param_109", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 18350080 + }, + { + "name": "param_110", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 19456000 + }, + { + "name": "param_111", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20561920 + }, + { + "name": "param_112", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20572160 + }, + { + "name": "param_114", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 20582400 + }, + { + "name": "param_115", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 21811200 + } + ] + }, + { + "dataPath": "params_shard_34.bin", + "format": "raw-shard", + "nbytes": 70778880, + "records": [ + { + "name": "param_119", + "shape": [ + 27648, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 70778880, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_35.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_122", + "shape": [ + 5120, + 1728 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_36.bin", + "format": "raw-shard", + "nbytes": 39321600, + "records": [ + { + "name": "param_127", + "shape": [ + 15360, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 39321600, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_37.bin", + "format": "raw-shard", + "nbytes": 23040000, + "records": [ + { + "name": "param_116", + "shape": [ + 5120, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_117", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13107200 + }, + { + "name": "param_118", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13516800 + }, + { + "name": "param_120", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 13926400 + }, + { + "name": "param_121", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 16138240 + }, + { + "name": "param_123", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 18350080 + }, + { + "name": "param_124", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 19456000 + }, + { + "name": "param_125", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20561920 + }, + { + "name": "param_126", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20572160 + }, + { + "name": "param_128", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 20582400 + }, + { + "name": "param_129", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 21811200 + } + ] + }, + { + "dataPath": "params_shard_38.bin", + "format": "raw-shard", + "nbytes": 70778880, + "records": [ + { + "name": "param_133", + "shape": [ + 27648, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 70778880, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_39.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_136", + "shape": [ + 5120, + 1728 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_40.bin", + "format": "raw-shard", + "nbytes": 39321600, + "records": [ + { + "name": "param_141", + "shape": [ + 15360, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 39321600, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_41.bin", + "format": "raw-shard", + "nbytes": 23040000, + "records": [ + { + "name": "param_130", + "shape": [ + 5120, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_131", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13107200 + }, + { + "name": "param_132", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13516800 + }, + { + "name": "param_134", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 13926400 + }, + { + "name": "param_135", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 16138240 + }, + { + "name": "param_137", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 18350080 + }, + { + "name": "param_138", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 19456000 + }, + { + "name": "param_139", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20561920 + }, + { + "name": "param_140", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20572160 + }, + { + "name": "param_142", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 20582400 + }, + { + "name": "param_143", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 21811200 + } + ] + }, + { + "dataPath": "params_shard_42.bin", + "format": "raw-shard", + "nbytes": 70778880, + "records": [ + { + "name": "param_147", + "shape": [ + 27648, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 70778880, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_43.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_150", + "shape": [ + 5120, + 1728 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_44.bin", + "format": "raw-shard", + "nbytes": 39321600, + "records": [ + { + "name": "param_155", + "shape": [ + 15360, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 39321600, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_45.bin", + "format": "raw-shard", + "nbytes": 23040000, + "records": [ + { + "name": "param_144", + "shape": [ + 5120, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_145", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13107200 + }, + { + "name": "param_146", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13516800 + }, + { + "name": "param_148", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 13926400 + }, + { + "name": "param_149", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 16138240 + }, + { + "name": "param_151", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 18350080 + }, + { + "name": "param_152", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 19456000 + }, + { + "name": "param_153", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20561920 + }, + { + "name": "param_154", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20572160 + }, + { + "name": "param_156", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 20582400 + }, + { + "name": "param_157", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 21811200 + } + ] + }, + { + "dataPath": "params_shard_46.bin", + "format": "raw-shard", + "nbytes": 70778880, + "records": [ + { + "name": "param_161", + "shape": [ + 27648, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 70778880, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_47.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_164", + "shape": [ + 5120, + 1728 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_48.bin", + "format": "raw-shard", + "nbytes": 39321600, + "records": [ + { + "name": "param_169", + "shape": [ + 15360, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 39321600, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_49.bin", + "format": "raw-shard", + "nbytes": 23040000, + "records": [ + { + "name": "param_158", + "shape": [ + 5120, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_159", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13107200 + }, + { + "name": "param_160", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13516800 + }, + { + "name": "param_162", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 13926400 + }, + { + "name": "param_163", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 16138240 + }, + { + "name": "param_165", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 18350080 + }, + { + "name": "param_166", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 19456000 + }, + { + "name": "param_167", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20561920 + }, + { + "name": "param_168", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20572160 + }, + { + "name": "param_170", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 20582400 + }, + { + "name": "param_171", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 21811200 + } + ] + }, + { + "dataPath": "params_shard_50.bin", + "format": "raw-shard", + "nbytes": 70778880, + "records": [ + { + "name": "param_175", + "shape": [ + 27648, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 70778880, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_51.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_178", + "shape": [ + 5120, + 1728 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_52.bin", + "format": "raw-shard", + "nbytes": 39321600, + "records": [ + { + "name": "param_183", + "shape": [ + 15360, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 39321600, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_53.bin", + "format": "raw-shard", + "nbytes": 23040000, + "records": [ + { + "name": "param_172", + "shape": [ + 5120, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_173", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13107200 + }, + { + "name": "param_174", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13516800 + }, + { + "name": "param_176", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 13926400 + }, + { + "name": "param_177", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 16138240 + }, + { + "name": "param_179", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 18350080 + }, + { + "name": "param_180", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 19456000 + }, + { + "name": "param_181", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20561920 + }, + { + "name": "param_182", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20572160 + }, + { + "name": "param_184", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 20582400 + }, + { + "name": "param_185", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 21811200 + } + ] + }, + { + "dataPath": "params_shard_54.bin", + "format": "raw-shard", + "nbytes": 70778880, + "records": [ + { + "name": "param_189", + "shape": [ + 27648, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 70778880, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_55.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_192", + "shape": [ + 5120, + 1728 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_56.bin", + "format": "raw-shard", + "nbytes": 39321600, + "records": [ + { + "name": "param_197", + "shape": [ + 15360, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 39321600, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_57.bin", + "format": "raw-shard", + "nbytes": 23040000, + "records": [ + { + "name": "param_186", + "shape": [ + 5120, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_187", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13107200 + }, + { + "name": "param_188", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13516800 + }, + { + "name": "param_190", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 13926400 + }, + { + "name": "param_191", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 16138240 + }, + { + "name": "param_193", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 18350080 + }, + { + "name": "param_194", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 19456000 + }, + { + "name": "param_195", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20561920 + }, + { + "name": "param_196", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20572160 + }, + { + "name": "param_198", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 20582400 + }, + { + "name": "param_199", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 21811200 + } + ] + }, + { + "dataPath": "params_shard_58.bin", + "format": "raw-shard", + "nbytes": 70778880, + "records": [ + { + "name": "param_203", + "shape": [ + 27648, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 70778880, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_59.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_206", + "shape": [ + 5120, + 1728 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_60.bin", + "format": "raw-shard", + "nbytes": 39321600, + "records": [ + { + "name": "param_211", + "shape": [ + 15360, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 39321600, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_61.bin", + "format": "raw-shard", + "nbytes": 23040000, + "records": [ + { + "name": "param_200", + "shape": [ + 5120, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_201", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13107200 + }, + { + "name": "param_202", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13516800 + }, + { + "name": "param_204", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 13926400 + }, + { + "name": "param_205", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 16138240 + }, + { + "name": "param_207", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 18350080 + }, + { + "name": "param_208", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 19456000 + }, + { + "name": "param_209", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20561920 + }, + { + "name": "param_210", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20572160 + }, + { + "name": "param_212", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 20582400 + }, + { + "name": "param_213", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 21811200 + } + ] + }, + { + "dataPath": "params_shard_62.bin", + "format": "raw-shard", + "nbytes": 70778880, + "records": [ + { + "name": "param_217", + "shape": [ + 27648, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 70778880, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_63.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_220", + "shape": [ + 5120, + 1728 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_64.bin", + "format": "raw-shard", + "nbytes": 39321600, + "records": [ + { + "name": "param_225", + "shape": [ + 15360, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 39321600, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_65.bin", + "format": "raw-shard", + "nbytes": 23040000, + "records": [ + { + "name": "param_214", + "shape": [ + 5120, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_215", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13107200 + }, + { + "name": "param_216", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13516800 + }, + { + "name": "param_218", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 13926400 + }, + { + "name": "param_219", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 16138240 + }, + { + "name": "param_221", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 18350080 + }, + { + "name": "param_222", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 19456000 + }, + { + "name": "param_223", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20561920 + }, + { + "name": "param_224", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20572160 + }, + { + "name": "param_226", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 20582400 + }, + { + "name": "param_227", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 21811200 + } + ] + }, + { + "dataPath": "params_shard_66.bin", + "format": "raw-shard", + "nbytes": 70778880, + "records": [ + { + "name": "param_231", + "shape": [ + 27648, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 70778880, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_67.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_234", + "shape": [ + 5120, + 1728 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_68.bin", + "format": "raw-shard", + "nbytes": 39321600, + "records": [ + { + "name": "param_239", + "shape": [ + 15360, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 39321600, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_69.bin", + "format": "raw-shard", + "nbytes": 23040000, + "records": [ + { + "name": "param_228", + "shape": [ + 5120, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_229", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13107200 + }, + { + "name": "param_230", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13516800 + }, + { + "name": "param_232", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 13926400 + }, + { + "name": "param_233", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 16138240 + }, + { + "name": "param_235", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 18350080 + }, + { + "name": "param_236", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 19456000 + }, + { + "name": "param_237", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20561920 + }, + { + "name": "param_238", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20572160 + }, + { + "name": "param_240", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 20582400 + }, + { + "name": "param_241", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 21811200 + } + ] + }, + { + "dataPath": "params_shard_70.bin", + "format": "raw-shard", + "nbytes": 70778880, + "records": [ + { + "name": "param_245", + "shape": [ + 27648, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 70778880, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_71.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_248", + "shape": [ + 5120, + 1728 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_72.bin", + "format": "raw-shard", + "nbytes": 39321600, + "records": [ + { + "name": "param_253", + "shape": [ + 15360, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 39321600, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_73.bin", + "format": "raw-shard", + "nbytes": 23040000, + "records": [ + { + "name": "param_242", + "shape": [ + 5120, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_243", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13107200 + }, + { + "name": "param_244", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13516800 + }, + { + "name": "param_246", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 13926400 + }, + { + "name": "param_247", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 16138240 + }, + { + "name": "param_249", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 18350080 + }, + { + "name": "param_250", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 19456000 + }, + { + "name": "param_251", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20561920 + }, + { + "name": "param_252", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20572160 + }, + { + "name": "param_254", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 20582400 + }, + { + "name": "param_255", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 21811200 + } + ] + }, + { + "dataPath": "params_shard_74.bin", + "format": "raw-shard", + "nbytes": 70778880, + "records": [ + { + "name": "param_259", + "shape": [ + 27648, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 70778880, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_75.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_262", + "shape": [ + 5120, + 1728 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_76.bin", + "format": "raw-shard", + "nbytes": 39321600, + "records": [ + { + "name": "param_267", + "shape": [ + 15360, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 39321600, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_77.bin", + "format": "raw-shard", + "nbytes": 23040000, + "records": [ + { + "name": "param_256", + "shape": [ + 5120, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_257", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13107200 + }, + { + "name": "param_258", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13516800 + }, + { + "name": "param_260", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 13926400 + }, + { + "name": "param_261", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 16138240 + }, + { + "name": "param_263", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 18350080 + }, + { + "name": "param_264", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 19456000 + }, + { + "name": "param_265", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20561920 + }, + { + "name": "param_266", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20572160 + }, + { + "name": "param_268", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 20582400 + }, + { + "name": "param_269", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 21811200 + } + ] + }, + { + "dataPath": "params_shard_78.bin", + "format": "raw-shard", + "nbytes": 70778880, + "records": [ + { + "name": "param_273", + "shape": [ + 27648, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 70778880, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_79.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_276", + "shape": [ + 5120, + 1728 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_80.bin", + "format": "raw-shard", + "nbytes": 39321600, + "records": [ + { + "name": "param_281", + "shape": [ + 15360, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 39321600, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_81.bin", + "format": "raw-shard", + "nbytes": 23040000, + "records": [ + { + "name": "param_270", + "shape": [ + 5120, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_271", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13107200 + }, + { + "name": "param_272", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13516800 + }, + { + "name": "param_274", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 13926400 + }, + { + "name": "param_275", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 16138240 + }, + { + "name": "param_277", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 18350080 + }, + { + "name": "param_278", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 19456000 + }, + { + "name": "param_279", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20561920 + }, + { + "name": "param_280", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20572160 + }, + { + "name": "param_282", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 20582400 + }, + { + "name": "param_283", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 21811200 + } + ] + }, + { + "dataPath": "params_shard_82.bin", + "format": "raw-shard", + "nbytes": 70778880, + "records": [ + { + "name": "param_287", + "shape": [ + 27648, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 70778880, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_83.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_290", + "shape": [ + 5120, + 1728 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_84.bin", + "format": "raw-shard", + "nbytes": 39321600, + "records": [ + { + "name": "param_295", + "shape": [ + 15360, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 39321600, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_85.bin", + "format": "raw-shard", + "nbytes": 23040000, + "records": [ + { + "name": "param_284", + "shape": [ + 5120, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_285", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13107200 + }, + { + "name": "param_286", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13516800 + }, + { + "name": "param_288", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 13926400 + }, + { + "name": "param_289", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 16138240 + }, + { + "name": "param_291", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 18350080 + }, + { + "name": "param_292", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 19456000 + }, + { + "name": "param_293", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20561920 + }, + { + "name": "param_294", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20572160 + }, + { + "name": "param_296", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 20582400 + }, + { + "name": "param_297", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 21811200 + } + ] + }, + { + "dataPath": "params_shard_86.bin", + "format": "raw-shard", + "nbytes": 70778880, + "records": [ + { + "name": "param_301", + "shape": [ + 27648, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 70778880, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_87.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_304", + "shape": [ + 5120, + 1728 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_88.bin", + "format": "raw-shard", + "nbytes": 39321600, + "records": [ + { + "name": "param_309", + "shape": [ + 15360, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 39321600, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_89.bin", + "format": "raw-shard", + "nbytes": 23040000, + "records": [ + { + "name": "param_298", + "shape": [ + 5120, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_299", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13107200 + }, + { + "name": "param_300", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13516800 + }, + { + "name": "param_302", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 13926400 + }, + { + "name": "param_303", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 16138240 + }, + { + "name": "param_305", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 18350080 + }, + { + "name": "param_306", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 19456000 + }, + { + "name": "param_307", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20561920 + }, + { + "name": "param_308", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20572160 + }, + { + "name": "param_310", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 20582400 + }, + { + "name": "param_311", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 21811200 + } + ] + }, + { + "dataPath": "params_shard_90.bin", + "format": "raw-shard", + "nbytes": 70778880, + "records": [ + { + "name": "param_315", + "shape": [ + 27648, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 70778880, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_91.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_318", + "shape": [ + 5120, + 1728 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_92.bin", + "format": "raw-shard", + "nbytes": 39321600, + "records": [ + { + "name": "param_323", + "shape": [ + 15360, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 39321600, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_93.bin", + "format": "raw-shard", + "nbytes": 23040000, + "records": [ + { + "name": "param_312", + "shape": [ + 5120, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_313", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13107200 + }, + { + "name": "param_314", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13516800 + }, + { + "name": "param_316", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 13926400 + }, + { + "name": "param_317", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 16138240 + }, + { + "name": "param_319", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 18350080 + }, + { + "name": "param_320", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 19456000 + }, + { + "name": "param_321", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20561920 + }, + { + "name": "param_322", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20572160 + }, + { + "name": "param_324", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 20582400 + }, + { + "name": "param_325", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 21811200 + } + ] + }, + { + "dataPath": "params_shard_94.bin", + "format": "raw-shard", + "nbytes": 70778880, + "records": [ + { + "name": "param_329", + "shape": [ + 27648, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 70778880, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_95.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_332", + "shape": [ + 5120, + 1728 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_96.bin", + "format": "raw-shard", + "nbytes": 39321600, + "records": [ + { + "name": "param_337", + "shape": [ + 15360, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 39321600, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_97.bin", + "format": "raw-shard", + "nbytes": 23040000, + "records": [ + { + "name": "param_326", + "shape": [ + 5120, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_327", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13107200 + }, + { + "name": "param_328", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13516800 + }, + { + "name": "param_330", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 13926400 + }, + { + "name": "param_331", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 16138240 + }, + { + "name": "param_333", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 18350080 + }, + { + "name": "param_334", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 19456000 + }, + { + "name": "param_335", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20561920 + }, + { + "name": "param_336", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20572160 + }, + { + "name": "param_338", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 20582400 + }, + { + "name": "param_339", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 21811200 + } + ] + }, + { + "dataPath": "params_shard_98.bin", + "format": "raw-shard", + "nbytes": 70778880, + "records": [ + { + "name": "param_343", + "shape": [ + 27648, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 70778880, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_99.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_346", + "shape": [ + 5120, + 1728 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_100.bin", + "format": "raw-shard", + "nbytes": 39321600, + "records": [ + { + "name": "param_351", + "shape": [ + 15360, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 39321600, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_101.bin", + "format": "raw-shard", + "nbytes": 23040000, + "records": [ + { + "name": "param_340", + "shape": [ + 5120, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_341", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13107200 + }, + { + "name": "param_342", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13516800 + }, + { + "name": "param_344", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 13926400 + }, + { + "name": "param_345", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 16138240 + }, + { + "name": "param_347", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 18350080 + }, + { + "name": "param_348", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 19456000 + }, + { + "name": "param_349", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20561920 + }, + { + "name": "param_350", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20572160 + }, + { + "name": "param_352", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 20582400 + }, + { + "name": "param_353", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 21811200 + } + ] + }, + { + "dataPath": "params_shard_102.bin", + "format": "raw-shard", + "nbytes": 70778880, + "records": [ + { + "name": "param_357", + "shape": [ + 27648, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 70778880, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_103.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_360", + "shape": [ + 5120, + 1728 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_104.bin", + "format": "raw-shard", + "nbytes": 39321600, + "records": [ + { + "name": "param_365", + "shape": [ + 15360, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 39321600, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_105.bin", + "format": "raw-shard", + "nbytes": 23040000, + "records": [ + { + "name": "param_354", + "shape": [ + 5120, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_355", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13107200 + }, + { + "name": "param_356", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13516800 + }, + { + "name": "param_358", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 13926400 + }, + { + "name": "param_359", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 16138240 + }, + { + "name": "param_361", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 18350080 + }, + { + "name": "param_362", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 19456000 + }, + { + "name": "param_363", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20561920 + }, + { + "name": "param_364", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20572160 + }, + { + "name": "param_366", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 20582400 + }, + { + "name": "param_367", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 21811200 + } + ] + }, + { + "dataPath": "params_shard_106.bin", + "format": "raw-shard", + "nbytes": 70778880, + "records": [ + { + "name": "param_371", + "shape": [ + 27648, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 70778880, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_107.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_374", + "shape": [ + 5120, + 1728 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_108.bin", + "format": "raw-shard", + "nbytes": 39321600, + "records": [ + { + "name": "param_379", + "shape": [ + 15360, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 39321600, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_109.bin", + "format": "raw-shard", + "nbytes": 23040000, + "records": [ + { + "name": "param_368", + "shape": [ + 5120, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_369", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13107200 + }, + { + "name": "param_370", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13516800 + }, + { + "name": "param_372", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 13926400 + }, + { + "name": "param_373", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 16138240 + }, + { + "name": "param_375", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 18350080 + }, + { + "name": "param_376", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 19456000 + }, + { + "name": "param_377", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20561920 + }, + { + "name": "param_378", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20572160 + }, + { + "name": "param_380", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 20582400 + }, + { + "name": "param_381", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 21811200 + } + ] + }, + { + "dataPath": "params_shard_110.bin", + "format": "raw-shard", + "nbytes": 70778880, + "records": [ + { + "name": "param_385", + "shape": [ + 27648, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 70778880, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_111.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_388", + "shape": [ + 5120, + 1728 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_112.bin", + "format": "raw-shard", + "nbytes": 39321600, + "records": [ + { + "name": "param_393", + "shape": [ + 15360, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 39321600, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_113.bin", + "format": "raw-shard", + "nbytes": 23040000, + "records": [ + { + "name": "param_382", + "shape": [ + 5120, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_383", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13107200 + }, + { + "name": "param_384", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13516800 + }, + { + "name": "param_386", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 13926400 + }, + { + "name": "param_387", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 16138240 + }, + { + "name": "param_389", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 18350080 + }, + { + "name": "param_390", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 19456000 + }, + { + "name": "param_391", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20561920 + }, + { + "name": "param_392", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20572160 + }, + { + "name": "param_394", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 20582400 + }, + { + "name": "param_395", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 21811200 + } + ] + }, + { + "dataPath": "params_shard_114.bin", + "format": "raw-shard", + "nbytes": 70778880, + "records": [ + { + "name": "param_399", + "shape": [ + 27648, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 70778880, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_115.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_402", + "shape": [ + 5120, + 1728 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_116.bin", + "format": "raw-shard", + "nbytes": 39321600, + "records": [ + { + "name": "param_407", + "shape": [ + 15360, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 39321600, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_117.bin", + "format": "raw-shard", + "nbytes": 23040000, + "records": [ + { + "name": "param_396", + "shape": [ + 5120, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_397", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13107200 + }, + { + "name": "param_398", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13516800 + }, + { + "name": "param_400", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 13926400 + }, + { + "name": "param_401", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 16138240 + }, + { + "name": "param_403", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 18350080 + }, + { + "name": "param_404", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 19456000 + }, + { + "name": "param_405", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20561920 + }, + { + "name": "param_406", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20572160 + }, + { + "name": "param_408", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 20582400 + }, + { + "name": "param_409", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 21811200 + } + ] + }, + { + "dataPath": "params_shard_118.bin", + "format": "raw-shard", + "nbytes": 70778880, + "records": [ + { + "name": "param_413", + "shape": [ + 27648, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 70778880, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_119.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_416", + "shape": [ + 5120, + 1728 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_120.bin", + "format": "raw-shard", + "nbytes": 39321600, + "records": [ + { + "name": "param_421", + "shape": [ + 15360, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 39321600, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_121.bin", + "format": "raw-shard", + "nbytes": 23040000, + "records": [ + { + "name": "param_410", + "shape": [ + 5120, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_411", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13107200 + }, + { + "name": "param_412", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13516800 + }, + { + "name": "param_414", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 13926400 + }, + { + "name": "param_415", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 16138240 + }, + { + "name": "param_417", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 18350080 + }, + { + "name": "param_418", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 19456000 + }, + { + "name": "param_419", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20561920 + }, + { + "name": "param_420", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20572160 + }, + { + "name": "param_422", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 20582400 + }, + { + "name": "param_423", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 21811200 + } + ] + }, + { + "dataPath": "params_shard_122.bin", + "format": "raw-shard", + "nbytes": 70778880, + "records": [ + { + "name": "param_427", + "shape": [ + 27648, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 70778880, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_123.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_430", + "shape": [ + 5120, + 1728 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_124.bin", + "format": "raw-shard", + "nbytes": 39321600, + "records": [ + { + "name": "param_435", + "shape": [ + 15360, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 39321600, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_125.bin", + "format": "raw-shard", + "nbytes": 23040000, + "records": [ + { + "name": "param_424", + "shape": [ + 5120, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_425", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13107200 + }, + { + "name": "param_426", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13516800 + }, + { + "name": "param_428", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 13926400 + }, + { + "name": "param_429", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 16138240 + }, + { + "name": "param_431", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 18350080 + }, + { + "name": "param_432", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 19456000 + }, + { + "name": "param_433", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20561920 + }, + { + "name": "param_434", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20572160 + }, + { + "name": "param_436", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 20582400 + }, + { + "name": "param_437", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 21811200 + } + ] + }, + { + "dataPath": "params_shard_126.bin", + "format": "raw-shard", + "nbytes": 70778880, + "records": [ + { + "name": "param_441", + "shape": [ + 27648, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 70778880, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_127.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_444", + "shape": [ + 5120, + 1728 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_128.bin", + "format": "raw-shard", + "nbytes": 39321600, + "records": [ + { + "name": "param_449", + "shape": [ + 15360, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 39321600, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_129.bin", + "format": "raw-shard", + "nbytes": 23040000, + "records": [ + { + "name": "param_438", + "shape": [ + 5120, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_439", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13107200 + }, + { + "name": "param_440", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13516800 + }, + { + "name": "param_442", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 13926400 + }, + { + "name": "param_443", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 16138240 + }, + { + "name": "param_445", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 18350080 + }, + { + "name": "param_446", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 19456000 + }, + { + "name": "param_447", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20561920 + }, + { + "name": "param_448", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20572160 + }, + { + "name": "param_450", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 20582400 + }, + { + "name": "param_451", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 21811200 + } + ] + }, + { + "dataPath": "params_shard_130.bin", + "format": "raw-shard", + "nbytes": 70778880, + "records": [ + { + "name": "param_455", + "shape": [ + 27648, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 70778880, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_131.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_458", + "shape": [ + 5120, + 1728 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_132.bin", + "format": "raw-shard", + "nbytes": 39321600, + "records": [ + { + "name": "param_463", + "shape": [ + 15360, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 39321600, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_133.bin", + "format": "raw-shard", + "nbytes": 23040000, + "records": [ + { + "name": "param_452", + "shape": [ + 5120, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_453", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13107200 + }, + { + "name": "param_454", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13516800 + }, + { + "name": "param_456", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 13926400 + }, + { + "name": "param_457", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 16138240 + }, + { + "name": "param_459", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 18350080 + }, + { + "name": "param_460", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 19456000 + }, + { + "name": "param_461", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20561920 + }, + { + "name": "param_462", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20572160 + }, + { + "name": "param_464", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 20582400 + }, + { + "name": "param_465", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 21811200 + } + ] + }, + { + "dataPath": "params_shard_134.bin", + "format": "raw-shard", + "nbytes": 70778880, + "records": [ + { + "name": "param_469", + "shape": [ + 27648, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 70778880, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_135.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_472", + "shape": [ + 5120, + 1728 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_136.bin", + "format": "raw-shard", + "nbytes": 39321600, + "records": [ + { + "name": "param_477", + "shape": [ + 15360, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 39321600, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_137.bin", + "format": "raw-shard", + "nbytes": 23040000, + "records": [ + { + "name": "param_466", + "shape": [ + 5120, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_467", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13107200 + }, + { + "name": "param_468", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13516800 + }, + { + "name": "param_470", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 13926400 + }, + { + "name": "param_471", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 16138240 + }, + { + "name": "param_473", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 18350080 + }, + { + "name": "param_474", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 19456000 + }, + { + "name": "param_475", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20561920 + }, + { + "name": "param_476", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20572160 + }, + { + "name": "param_478", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 20582400 + }, + { + "name": "param_479", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 21811200 + } + ] + }, + { + "dataPath": "params_shard_138.bin", + "format": "raw-shard", + "nbytes": 70778880, + "records": [ + { + "name": "param_483", + "shape": [ + 27648, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 70778880, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_139.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_486", + "shape": [ + 5120, + 1728 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_140.bin", + "format": "raw-shard", + "nbytes": 39321600, + "records": [ + { + "name": "param_491", + "shape": [ + 15360, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 39321600, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_141.bin", + "format": "raw-shard", + "nbytes": 23040000, + "records": [ + { + "name": "param_480", + "shape": [ + 5120, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_481", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13107200 + }, + { + "name": "param_482", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13516800 + }, + { + "name": "param_484", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 13926400 + }, + { + "name": "param_485", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 16138240 + }, + { + "name": "param_487", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 18350080 + }, + { + "name": "param_488", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 19456000 + }, + { + "name": "param_489", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20561920 + }, + { + "name": "param_490", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20572160 + }, + { + "name": "param_492", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 20582400 + }, + { + "name": "param_493", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 21811200 + } + ] + }, + { + "dataPath": "params_shard_142.bin", + "format": "raw-shard", + "nbytes": 70778880, + "records": [ + { + "name": "param_497", + "shape": [ + 27648, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 70778880, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_143.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_500", + "shape": [ + 5120, + 1728 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_144.bin", + "format": "raw-shard", + "nbytes": 39321600, + "records": [ + { + "name": "param_505", + "shape": [ + 15360, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 39321600, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_145.bin", + "format": "raw-shard", + "nbytes": 23040000, + "records": [ + { + "name": "param_494", + "shape": [ + 5120, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_495", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13107200 + }, + { + "name": "param_496", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13516800 + }, + { + "name": "param_498", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 13926400 + }, + { + "name": "param_499", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 16138240 + }, + { + "name": "param_501", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 18350080 + }, + { + "name": "param_502", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 19456000 + }, + { + "name": "param_503", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20561920 + }, + { + "name": "param_504", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20572160 + }, + { + "name": "param_506", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 20582400 + }, + { + "name": "param_507", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 21811200 + } + ] + }, + { + "dataPath": "params_shard_146.bin", + "format": "raw-shard", + "nbytes": 70778880, + "records": [ + { + "name": "param_511", + "shape": [ + 27648, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 70778880, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_147.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_514", + "shape": [ + 5120, + 1728 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_148.bin", + "format": "raw-shard", + "nbytes": 39321600, + "records": [ + { + "name": "param_519", + "shape": [ + 15360, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 39321600, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_149.bin", + "format": "raw-shard", + "nbytes": 23040000, + "records": [ + { + "name": "param_508", + "shape": [ + 5120, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_509", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13107200 + }, + { + "name": "param_510", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13516800 + }, + { + "name": "param_512", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 13926400 + }, + { + "name": "param_513", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 16138240 + }, + { + "name": "param_515", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 18350080 + }, + { + "name": "param_516", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 19456000 + }, + { + "name": "param_517", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20561920 + }, + { + "name": "param_518", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20572160 + }, + { + "name": "param_520", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 20582400 + }, + { + "name": "param_521", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 21811200 + } + ] + }, + { + "dataPath": "params_shard_150.bin", + "format": "raw-shard", + "nbytes": 70778880, + "records": [ + { + "name": "param_525", + "shape": [ + 27648, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 70778880, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_151.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_528", + "shape": [ + 5120, + 1728 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_152.bin", + "format": "raw-shard", + "nbytes": 39321600, + "records": [ + { + "name": "param_533", + "shape": [ + 15360, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 39321600, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_153.bin", + "format": "raw-shard", + "nbytes": 23040000, + "records": [ + { + "name": "param_522", + "shape": [ + 5120, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_523", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13107200 + }, + { + "name": "param_524", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13516800 + }, + { + "name": "param_526", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 13926400 + }, + { + "name": "param_527", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 16138240 + }, + { + "name": "param_529", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 18350080 + }, + { + "name": "param_530", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 19456000 + }, + { + "name": "param_531", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20561920 + }, + { + "name": "param_532", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20572160 + }, + { + "name": "param_534", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 20582400 + }, + { + "name": "param_535", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 21811200 + } + ] + }, + { + "dataPath": "params_shard_154.bin", + "format": "raw-shard", + "nbytes": 70778880, + "records": [ + { + "name": "param_539", + "shape": [ + 27648, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 70778880, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_155.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_542", + "shape": [ + 5120, + 1728 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_156.bin", + "format": "raw-shard", + "nbytes": 39321600, + "records": [ + { + "name": "param_547", + "shape": [ + 15360, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 39321600, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_157.bin", + "format": "raw-shard", + "nbytes": 23040000, + "records": [ + { + "name": "param_536", + "shape": [ + 5120, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_537", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13107200 + }, + { + "name": "param_538", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13516800 + }, + { + "name": "param_540", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 13926400 + }, + { + "name": "param_541", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 16138240 + }, + { + "name": "param_543", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 18350080 + }, + { + "name": "param_544", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 19456000 + }, + { + "name": "param_545", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20561920 + }, + { + "name": "param_546", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20572160 + }, + { + "name": "param_548", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 20582400 + }, + { + "name": "param_549", + "shape": [ + 15360, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1228800, + "byteOffset": 21811200 + } + ] + }, + { + "dataPath": "params_shard_158.bin", + "format": "raw-shard", + "nbytes": 70778880, + "records": [ + { + "name": "param_553", + "shape": [ + 27648, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 70778880, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_159.bin", + "format": "raw-shard", + "nbytes": 35389440, + "records": [ + { + "name": "param_556", + "shape": [ + 5120, + 1728 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 35389440, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_160.bin", + "format": "raw-shard", + "nbytes": 327680000, + "records": [ + { + "name": "param_562", + "shape": [ + 32000, + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 327680000, + "byteOffset": 0 + } + ] + }, + { + "dataPath": "params_shard_161.bin", + "format": "raw-shard", + "nbytes": 21641216, + "records": [ + { + "name": "param_550", + "shape": [ + 5120, + 640 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 13107200, + "byteOffset": 0 + }, + { + "name": "param_551", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13107200 + }, + { + "name": "param_552", + "shape": [ + 5120, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 409600, + "byteOffset": 13516800 + }, + { + "name": "param_554", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 13926400 + }, + { + "name": "param_555", + "shape": [ + 27648, + 40 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 2211840, + "byteOffset": 16138240 + }, + { + "name": "param_557", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 18350080 + }, + { + "name": "param_558", + "shape": [ + 5120, + 108 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1105920, + "byteOffset": 19456000 + }, + { + "name": "param_559", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20561920 + }, + { + "name": "param_560", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20572160 + }, + { + "name": "param_561", + "shape": [ + 5120 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 10240, + "byteOffset": 20582400 + }, + { + "name": "param_563", + "shape": [ + 2048, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 524288, + "byteOffset": 20592640 + }, + { + "name": "param_564", + "shape": [ + 2048, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 524288, + "byteOffset": 21116928 + } + ] + } + ] +} \ No newline at end of file diff --git a/params_shard_0.bin b/params_shard_0.bin new file mode 100644 index 0000000000000000000000000000000000000000..ece15ec1cc7c992a929d2dd2219d05ce83d421d8 --- /dev/null +++ b/params_shard_0.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0a1694544d7be05af747e5a33e20224a650a3a3c85ecaf3776756716f7c63cd +size 327680000 diff --git a/params_shard_1.bin b/params_shard_1.bin new file mode 100644 index 0000000000000000000000000000000000000000..cbda4dbf396c17d5d71c5d56f96894b0c915a317 --- /dev/null +++ b/params_shard_1.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fda9d9fafcc89135636b4f1486ba9d496848f1b9e1604e282ccaf5adb013708 +size 39321600 diff --git a/params_shard_10.bin b/params_shard_10.bin new file mode 100644 index 0000000000000000000000000000000000000000..dcdfc8f8d57d6700f0ab32d48579208444632e1e --- /dev/null +++ b/params_shard_10.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1dbe14205097244877c19efe33eec633e4bad1ea89f0548a09fafa3c8474e51 +size 70778880 diff --git a/params_shard_100.bin b/params_shard_100.bin new file mode 100644 index 0000000000000000000000000000000000000000..59a3f61ab9a9fef9eb1ec048365ab630d0dbfb21 --- /dev/null +++ b/params_shard_100.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55874b38300198e5944f25a208257fc80dae8768f93f563ce28e18465d883ea9 +size 39321600 diff --git a/params_shard_101.bin b/params_shard_101.bin new file mode 100644 index 0000000000000000000000000000000000000000..83e7145418f893b490f8ddb0464479d7c447e819 --- /dev/null +++ b/params_shard_101.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c6c8c9a1508d9f1c64cbbe8acceabcfd2bf449f60a7202d2dd303c9733f7028 +size 23040000 diff --git a/params_shard_102.bin b/params_shard_102.bin new file mode 100644 index 0000000000000000000000000000000000000000..e87f8e202b11d335b51d2463762a5d96b5495a59 --- /dev/null +++ b/params_shard_102.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e767dbac6fd550258f1f87945686a35be9ab417510dc471e1695fb40376c295 +size 70778880 diff --git a/params_shard_103.bin b/params_shard_103.bin new file mode 100644 index 0000000000000000000000000000000000000000..274a06da36a7255c379c3e67f1377718a186247a --- /dev/null +++ b/params_shard_103.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad19ed0d81fff94e5a695645393fd464aa2a1b9260e5b9ac547dbc5b8025bded +size 35389440 diff --git a/params_shard_104.bin b/params_shard_104.bin new file mode 100644 index 0000000000000000000000000000000000000000..9a8972b5862da78b9536df65f3445566a324b790 --- /dev/null +++ b/params_shard_104.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9aa2154678897df8626b3d3f910db08f924e2706741a01d7087c59136526670a +size 39321600 diff --git a/params_shard_105.bin b/params_shard_105.bin new file mode 100644 index 0000000000000000000000000000000000000000..4a9401aef3a42f97bb007dc8ed786629a8f6ced8 --- /dev/null +++ b/params_shard_105.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d16911a32a44fef5b07b0944d904a8a191e0f98d35202a159ee65ed166a5390 +size 23040000 diff --git a/params_shard_106.bin b/params_shard_106.bin new file mode 100644 index 0000000000000000000000000000000000000000..58e85d8fb805b917c01a0647dd94e6ca924b3129 --- /dev/null +++ b/params_shard_106.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08c29022678cebfc9bff9c949203f199ee6ceb748454a0702ae3042a00235057 +size 70778880 diff --git a/params_shard_107.bin b/params_shard_107.bin new file mode 100644 index 0000000000000000000000000000000000000000..8515310dda119ca028e854ea7f437ffd41b261d2 --- /dev/null +++ b/params_shard_107.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc1910a1d673466b65b3b6476bdba2e4a8736a701f65522a0ec5c2b9cb2816c5 +size 35389440 diff --git a/params_shard_108.bin b/params_shard_108.bin new file mode 100644 index 0000000000000000000000000000000000000000..8101a705be66c4977a080e0e4538942e695710d0 --- /dev/null +++ b/params_shard_108.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90be4b61c83012ec2cfebb813c865c050aff7ee6faedd9203340535c69e111d9 +size 39321600 diff --git a/params_shard_109.bin b/params_shard_109.bin new file mode 100644 index 0000000000000000000000000000000000000000..049535de33a1268556978fb0a7a6dd296212a1ab --- /dev/null +++ b/params_shard_109.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d60aa00dc796f035df511fdabccc6ae81fbac36992b1d7768def9012326f0c0e +size 23040000 diff --git a/params_shard_11.bin b/params_shard_11.bin new file mode 100644 index 0000000000000000000000000000000000000000..ef95bbf65dc3ee9242ba42b9a0a599a82e3587b8 --- /dev/null +++ b/params_shard_11.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9c6580f513436ba76a1d74595266db28b95924d5e07b5d7cc0590f807383308 +size 35389440 diff --git a/params_shard_110.bin b/params_shard_110.bin new file mode 100644 index 0000000000000000000000000000000000000000..e0c3270579c97281ed06ec1f600fe07eb9e04872 --- /dev/null +++ b/params_shard_110.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d546bb927ef5b52239a84dc2958cc70fd27d13b99ecb38ec37193ff69e3a7d7b +size 70778880 diff --git a/params_shard_111.bin b/params_shard_111.bin new file mode 100644 index 0000000000000000000000000000000000000000..81f196f5cbf713341197eea61b7e48c18a381b8a --- /dev/null +++ b/params_shard_111.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8473a224c577721c044ed728ea408c41b867ef240f799bfb639138e9d1a2a2e8 +size 35389440 diff --git a/params_shard_112.bin b/params_shard_112.bin new file mode 100644 index 0000000000000000000000000000000000000000..c7b1c1bc3ea9473eefd587f60c313e20b47f790e --- /dev/null +++ b/params_shard_112.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5cdb721d7d4e97f00eee2da2a5af4ba88af4f25dff4f9c8634297bd62b7b6a6 +size 39321600 diff --git a/params_shard_113.bin b/params_shard_113.bin new file mode 100644 index 0000000000000000000000000000000000000000..04b3f0f6d4c1ddd0f66ae63373836bceefdd7c67 --- /dev/null +++ b/params_shard_113.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8225a3b23e99be0aeef52dc0fbb56c0c5c161c5f1e4728680b1c69c568592e6a +size 23040000 diff --git a/params_shard_114.bin b/params_shard_114.bin new file mode 100644 index 0000000000000000000000000000000000000000..1ae1f1f5a4275f7923e6021472b7eb60bc728d29 --- /dev/null +++ b/params_shard_114.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:098c618c13d195f2b6525f61316edb6e5ba318a559d82326005a31f67b520507 +size 70778880 diff --git a/params_shard_115.bin b/params_shard_115.bin new file mode 100644 index 0000000000000000000000000000000000000000..ae3970470697d269e208abad44fa4cc17c95c835 --- /dev/null +++ b/params_shard_115.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce5e7f1cea4f24ef1ac4a847916e2806018a4eb24ca39f389093a928009175e1 +size 35389440 diff --git a/params_shard_116.bin b/params_shard_116.bin new file mode 100644 index 0000000000000000000000000000000000000000..d0e78fe2f32eec371877835d309ec839a4a9437f --- /dev/null +++ b/params_shard_116.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f5d17feaeb762e5074c4d95e47e92ebab6bd0dbdf4eba1bab191f2ee8bf811b +size 39321600 diff --git a/params_shard_117.bin b/params_shard_117.bin new file mode 100644 index 0000000000000000000000000000000000000000..cb695e09e4367ac3a676a461abb34c335cf172c0 --- /dev/null +++ b/params_shard_117.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6de3b1beac914dfd4cb2e4399222abd702157340a97bac23b4532ddcb421b2f6 +size 23040000 diff --git a/params_shard_118.bin b/params_shard_118.bin new file mode 100644 index 0000000000000000000000000000000000000000..4988e95cd6dd4f05fe3057140d3446d0c97462a4 --- /dev/null +++ b/params_shard_118.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3c6ce8c125e16df46f438dc3752264c155535dbf61c888d0577d49dcd9879b4 +size 70778880 diff --git a/params_shard_119.bin b/params_shard_119.bin new file mode 100644 index 0000000000000000000000000000000000000000..dd9e3e20b70b8757007fb61d3544f517b21c7217 --- /dev/null +++ b/params_shard_119.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3108077b719bfbe9c72c63b9435bccd8c45e8d0916eee292ce871e8c21b91de3 +size 35389440 diff --git a/params_shard_12.bin b/params_shard_12.bin new file mode 100644 index 0000000000000000000000000000000000000000..aaed5b1d045fea296b017765f2ca7ed839f4eb1a --- /dev/null +++ b/params_shard_12.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3763f6195964c027116885fce9e5e71b193469312fbd4eb3f58de5935146f89a +size 39321600 diff --git a/params_shard_120.bin b/params_shard_120.bin new file mode 100644 index 0000000000000000000000000000000000000000..66ebc5f1faaa1b0cbcea454383d11d3b557d0b2a --- /dev/null +++ b/params_shard_120.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3c6773e5feec35468630ef714d37d6e30a7fb069caec884706160ba082095f8 +size 39321600 diff --git a/params_shard_121.bin b/params_shard_121.bin new file mode 100644 index 0000000000000000000000000000000000000000..e43283f92a959f4e3674e9b45453fcece41bb474 --- /dev/null +++ b/params_shard_121.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0270dbe37457ae8ff97d42121029084bf2573b0935de2c79f99074af61c0c4ed +size 23040000 diff --git a/params_shard_122.bin b/params_shard_122.bin new file mode 100644 index 0000000000000000000000000000000000000000..c883d42e38824a75dbc19a2adce78364003f0897 --- /dev/null +++ b/params_shard_122.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f333b1883add955484ecd76bfcf9d7dcaf8cc6e32e674d1b576cba91de940b7 +size 70778880 diff --git a/params_shard_123.bin b/params_shard_123.bin new file mode 100644 index 0000000000000000000000000000000000000000..59705d46960d2e63aa4be96332a646430d3152a0 --- /dev/null +++ b/params_shard_123.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31428d2ca45e769e368f5359e0b0ec69e52d9bbb3d72b2074a55d591a90c4ac6 +size 35389440 diff --git a/params_shard_124.bin b/params_shard_124.bin new file mode 100644 index 0000000000000000000000000000000000000000..00a157e9eb671315337fa8be1fab769c6f7024b4 --- /dev/null +++ b/params_shard_124.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a96c3525e6f3b67710da3c87c4c1210ff3acb9328447d8138d4777f5aa65cde9 +size 39321600 diff --git a/params_shard_125.bin b/params_shard_125.bin new file mode 100644 index 0000000000000000000000000000000000000000..acb6d8e7b84f7c0f1821c54101ea7596fa6085aa --- /dev/null +++ b/params_shard_125.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c059b89b253acd93223039fe286bb4c36c8de44d6e40a5e3248f3cad7c1a4235 +size 23040000 diff --git a/params_shard_126.bin b/params_shard_126.bin new file mode 100644 index 0000000000000000000000000000000000000000..47617b07891072c1ff80aed6c49449c2a49d464b --- /dev/null +++ b/params_shard_126.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4707673486e3871ed943cab3ac70ba7ec662fdbca6ff33a552d1b4c9455db41 +size 70778880 diff --git a/params_shard_127.bin b/params_shard_127.bin new file mode 100644 index 0000000000000000000000000000000000000000..ab19a4f9f62544e6a04614c28c3a8cb4ddece5f5 --- /dev/null +++ b/params_shard_127.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1587257f967084fc8e95b5160af19320fb680aced5f58a96593c0b058288ef92 +size 35389440 diff --git a/params_shard_128.bin b/params_shard_128.bin new file mode 100644 index 0000000000000000000000000000000000000000..7788d9aa01b7c8794a619bdb6a8d9f8ef3c1e6bf --- /dev/null +++ b/params_shard_128.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e664a2282d99a2eb3737d26e948ad4a1dc1501547f0216dcc01fe352694b0262 +size 39321600 diff --git a/params_shard_129.bin b/params_shard_129.bin new file mode 100644 index 0000000000000000000000000000000000000000..ff065f144334e0bef527da44c5a642539d43f9d3 --- /dev/null +++ b/params_shard_129.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00b31d9fef2a5e66c49411b2f7742a82bac093eaa0f051c6eeb6415a8cb27bf0 +size 23040000 diff --git a/params_shard_13.bin b/params_shard_13.bin new file mode 100644 index 0000000000000000000000000000000000000000..855a55d20410995595af84d68da8dd23915669d9 --- /dev/null +++ b/params_shard_13.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de71ba74dfb4d48c131f68d8ceaa77b5927d1b22c8ba03019c29547fa5df62c8 +size 23040000 diff --git a/params_shard_130.bin b/params_shard_130.bin new file mode 100644 index 0000000000000000000000000000000000000000..826dfebb73a2dadb6844ed05e98a0fdd62ee7ae5 --- /dev/null +++ b/params_shard_130.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ea8d23993b403c46dc8fa895b213c6841745a8c1f749abab095d0be79ca6050 +size 70778880 diff --git a/params_shard_131.bin b/params_shard_131.bin new file mode 100644 index 0000000000000000000000000000000000000000..e8aef30f74b5ef89d661cd8702fa6cd0ef4bea9c --- /dev/null +++ b/params_shard_131.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0f41fcc6c1f1bbfcd47018938b3fb32aa320ffc6a5d9c94c63346d0ca8633d2 +size 35389440 diff --git a/params_shard_132.bin b/params_shard_132.bin new file mode 100644 index 0000000000000000000000000000000000000000..331c774451fe4443435e90bd5d5f592f887def32 --- /dev/null +++ b/params_shard_132.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b1f7c2327f419bf9ce52c13b3bca72a44d35d643acd64929c5938ec22ebf50d +size 39321600 diff --git a/params_shard_133.bin b/params_shard_133.bin new file mode 100644 index 0000000000000000000000000000000000000000..8dab9b7445f4c597b9b729ea9aa8017c751fd5c3 --- /dev/null +++ b/params_shard_133.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2891a2944496ff2ea3717fc4a3c430eca7f58c2eca76dcde2a27c7ae342fb5fb +size 23040000 diff --git a/params_shard_134.bin b/params_shard_134.bin new file mode 100644 index 0000000000000000000000000000000000000000..8be75e525bc195dd41d73bce2bde8536a9a4eea8 --- /dev/null +++ b/params_shard_134.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:557158bd11dfca53debbc5728d1cde01c75b19c46edb7b44ea4b15b6b05954ed +size 70778880 diff --git a/params_shard_135.bin b/params_shard_135.bin new file mode 100644 index 0000000000000000000000000000000000000000..81856e720ca79bbd86ab4c352e699ba4dd7a1fd4 --- /dev/null +++ b/params_shard_135.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d887296f83d36c23cb1dd5c6cebf42bde7e07496cca4c0316a83f3e566ee205 +size 35389440 diff --git a/params_shard_136.bin b/params_shard_136.bin new file mode 100644 index 0000000000000000000000000000000000000000..4ae434857979dce713420909f8e52cb0a7d6f775 --- /dev/null +++ b/params_shard_136.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:780a88164859c64d25dcaf95e070c6864ab99dd3935d24a24360fb1767125dbf +size 39321600 diff --git a/params_shard_137.bin b/params_shard_137.bin new file mode 100644 index 0000000000000000000000000000000000000000..6886c4e90c75d0b8d299691860f5e17b155c03ea --- /dev/null +++ b/params_shard_137.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f55cdbe2b82d765ee9c40392cd964a54b337e8ca2e8c20622fbf0ce250b8e873 +size 23040000 diff --git a/params_shard_138.bin b/params_shard_138.bin new file mode 100644 index 0000000000000000000000000000000000000000..e8f6c98e631866a3a383f1da076da0290f259b2e --- /dev/null +++ b/params_shard_138.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aebf3306540a11d3cfaa8fd1c1199f2c2bf5f26619b269a0dee5dd4df861f7d2 +size 70778880 diff --git a/params_shard_139.bin b/params_shard_139.bin new file mode 100644 index 0000000000000000000000000000000000000000..b9ab4ae7ee53888af633a4aa3e3e82d33f3f7120 --- /dev/null +++ b/params_shard_139.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec847c9ea1b3d77d398b513f9e9a5a06f0acc720b3b52b74f489d7f9b025e469 +size 35389440 diff --git a/params_shard_14.bin b/params_shard_14.bin new file mode 100644 index 0000000000000000000000000000000000000000..0d707e7573f4d72dca86c105848f953e99358697 --- /dev/null +++ b/params_shard_14.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2572db0662a23eec44ab2164984cc8ec8f2cdf53890b91c45fb3e6d391194b62 +size 70778880 diff --git a/params_shard_140.bin b/params_shard_140.bin new file mode 100644 index 0000000000000000000000000000000000000000..e2ee2db63887d3d846e57c6ef2691df94a1c6524 --- /dev/null +++ b/params_shard_140.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4e7d7ac582ddaa0815fed9f8a0edfb22e7c2ef7f69cbfbf0805eca85c1ffcb5 +size 39321600 diff --git a/params_shard_141.bin b/params_shard_141.bin new file mode 100644 index 0000000000000000000000000000000000000000..c79764476bf593714588d12d70489fc738120544 --- /dev/null +++ b/params_shard_141.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:311370259089218261aeb512604126bbd3350a4ae50c7a5fedd4406931addf23 +size 23040000 diff --git a/params_shard_142.bin b/params_shard_142.bin new file mode 100644 index 0000000000000000000000000000000000000000..ddd031e9dd827a9d3020457c586e7bf6898f07ce --- /dev/null +++ b/params_shard_142.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fe2933127c134d77d0304834f3b4602fd32b1af7784bc5f8106281aa6439dd4 +size 70778880 diff --git a/params_shard_143.bin b/params_shard_143.bin new file mode 100644 index 0000000000000000000000000000000000000000..f6c52422954cce8c4fe34482a9a141a276b8244b --- /dev/null +++ b/params_shard_143.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a85acf391d567e1168dc71893afa96d6100f9b650d0952ad4cdcf06b8a963a7 +size 35389440 diff --git a/params_shard_144.bin b/params_shard_144.bin new file mode 100644 index 0000000000000000000000000000000000000000..74c6e19b5819ad2b126a39fa79ba903afa7ef69d --- /dev/null +++ b/params_shard_144.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f08f4f56ddcb3c06f538b63b014df2e6b396841301ecc7ac5801020d3c17385b +size 39321600 diff --git a/params_shard_145.bin b/params_shard_145.bin new file mode 100644 index 0000000000000000000000000000000000000000..a6f4a2eb4e8a2f77e9b99e0ba965d95ce7f7542a --- /dev/null +++ b/params_shard_145.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb6492e0b9f397b13e9751cf56670cf4ce7bcd3184ab91ee67c3c1a5cebb72f7 +size 23040000 diff --git a/params_shard_146.bin b/params_shard_146.bin new file mode 100644 index 0000000000000000000000000000000000000000..2345265a10ea95021bdf1c729beb5580f1f440c1 --- /dev/null +++ b/params_shard_146.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:feb03cbb3e9896b067e107b63787ca231681b88d1c1a23bb17643132da8088ed +size 70778880 diff --git a/params_shard_147.bin b/params_shard_147.bin new file mode 100644 index 0000000000000000000000000000000000000000..1f6aeb9b56c5f3418871189590d9d32823cee95a --- /dev/null +++ b/params_shard_147.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f9a7af28b7c272e265194fe84106ab7c6d15e21b6cd5a5ea3f8619c4ac26e35 +size 35389440 diff --git a/params_shard_148.bin b/params_shard_148.bin new file mode 100644 index 0000000000000000000000000000000000000000..fd0f48b7ae6115d3455bd3404aec4802b21c06eb --- /dev/null +++ b/params_shard_148.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0d3e6a1c276406b76d481c991c9fa89102c9e6516fc3f67ffb4a323411d507a +size 39321600 diff --git a/params_shard_149.bin b/params_shard_149.bin new file mode 100644 index 0000000000000000000000000000000000000000..d908eb77e6637f2a354c6bd166e32339d6aecd93 --- /dev/null +++ b/params_shard_149.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f8000e4587dc5fd9f6d749e1453e12f3acbbd68e4e7545d617688f92a1ffdd1 +size 23040000 diff --git a/params_shard_15.bin b/params_shard_15.bin new file mode 100644 index 0000000000000000000000000000000000000000..7242e401cd68b3e8f3ccdb20adc7680f2f3b3d1a --- /dev/null +++ b/params_shard_15.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:928e7c17baf9f7eef3d2ff059391a3c9bbe4474c8a4680bd5e939a86c623588d +size 35389440 diff --git a/params_shard_150.bin b/params_shard_150.bin new file mode 100644 index 0000000000000000000000000000000000000000..343c3d0e3d1b59846495f09f265b965f929ae326 --- /dev/null +++ b/params_shard_150.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9450e56957863cf667b80224484e91921b0d35b44bdaa2e76df6e13f29487ee +size 70778880 diff --git a/params_shard_151.bin b/params_shard_151.bin new file mode 100644 index 0000000000000000000000000000000000000000..acbddb773e8723f8dd037934f0f7303dff30bf99 --- /dev/null +++ b/params_shard_151.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8f0da2f147aac18b8eb46671eb97ccc451d32a84093576f69a30eb0694c951b +size 35389440 diff --git a/params_shard_152.bin b/params_shard_152.bin new file mode 100644 index 0000000000000000000000000000000000000000..ead6ecbaae0cfadbd8b41cc20930f338f5dd5816 --- /dev/null +++ b/params_shard_152.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b464288eaf877f5d6688abd12f442751dcba30f285eac323eca311483cdbf126 +size 39321600 diff --git a/params_shard_153.bin b/params_shard_153.bin new file mode 100644 index 0000000000000000000000000000000000000000..cdd424da9fb5e582e1b9ba58553024682e1f2db1 --- /dev/null +++ b/params_shard_153.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c0357a0a9e14f8618b24f58f3c25380245dc9aaf5045d78fb784cd98db2f6ac +size 23040000 diff --git a/params_shard_154.bin b/params_shard_154.bin new file mode 100644 index 0000000000000000000000000000000000000000..edf18f7023451e9364db2caa2e67401c0e859362 --- /dev/null +++ b/params_shard_154.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc3120ffa3897057cf56b0d73b7b237da957e6576b0e1c6b923abb79a78d95d8 +size 70778880 diff --git a/params_shard_155.bin b/params_shard_155.bin new file mode 100644 index 0000000000000000000000000000000000000000..19de3b9e43912e70f036dae577624727d6b484c9 --- /dev/null +++ b/params_shard_155.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2646c510884d3dac4c9e1f8ff0774664ecc93767f87f198ee7ee9fa43d906149 +size 35389440 diff --git a/params_shard_156.bin b/params_shard_156.bin new file mode 100644 index 0000000000000000000000000000000000000000..430a49659ec20035667d82d42520911baebdff0f --- /dev/null +++ b/params_shard_156.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc6f9a800ef0d4d894e6b3d408e261104328060df0b371eb8da616859b57f5cf +size 39321600 diff --git a/params_shard_157.bin b/params_shard_157.bin new file mode 100644 index 0000000000000000000000000000000000000000..00c417292d187184e9d1e21d813a76a88f715eb6 --- /dev/null +++ b/params_shard_157.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f221b6a123b362fe66b0b84a528b64d7e6d04b17c80dce2f0d143ab24da3c7e +size 23040000 diff --git a/params_shard_158.bin b/params_shard_158.bin new file mode 100644 index 0000000000000000000000000000000000000000..b0f3d1dd6485afc6f2711b8f37445739944fe13e --- /dev/null +++ b/params_shard_158.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5b61a982146a20079b62df7b3bab04d136c4c9c8ace4b2ddb2287c2890257b7 +size 70778880 diff --git a/params_shard_159.bin b/params_shard_159.bin new file mode 100644 index 0000000000000000000000000000000000000000..e19ebf6f7615aaf789e1f766c1298e12a914a91e --- /dev/null +++ b/params_shard_159.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c937b57a101f5db52fcd8a08537d3ac993e8ad8e6cf03065155dac76f17e06a4 +size 35389440 diff --git a/params_shard_16.bin b/params_shard_16.bin new file mode 100644 index 0000000000000000000000000000000000000000..ab2ee291ba5e8cea8068844f8d885aeab209563f --- /dev/null +++ b/params_shard_16.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80c32f0d3ac85f8148e35a28e93f3419824c50532d575720ba22cdbd4e6dc3c8 +size 39321600 diff --git a/params_shard_160.bin b/params_shard_160.bin new file mode 100644 index 0000000000000000000000000000000000000000..c7f6711c52ecd7669b99a2746251017564a19d85 --- /dev/null +++ b/params_shard_160.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09a8115a3b930d69b1a31c828ebc65a20864b9a5491e57dbfcffcd3d1044cbe9 +size 327680000 diff --git a/params_shard_161.bin b/params_shard_161.bin new file mode 100644 index 0000000000000000000000000000000000000000..a010a4e17661606c62b343d5f6e9ff63b65bd1b4 --- /dev/null +++ b/params_shard_161.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ded17dcbee5c0d45214b5e7c45669807844bfe5f27ee5449c587508597846d1 +size 21641216 diff --git a/params_shard_17.bin b/params_shard_17.bin new file mode 100644 index 0000000000000000000000000000000000000000..d7e214c53a11a6a5f1361432ca0ee69007e36f64 --- /dev/null +++ b/params_shard_17.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ccfb7d724039ce387ef6e8cf20f791b2ee849382d4d65129fd9630652e268a8 +size 23040000 diff --git a/params_shard_18.bin b/params_shard_18.bin new file mode 100644 index 0000000000000000000000000000000000000000..2c813854fdb664f5f9d3bbcbc33ed6e0362ea134 --- /dev/null +++ b/params_shard_18.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abc6b498530781fb1814ae3e6a8e690882210357af3e3b197621c2ffb10c2157 +size 70778880 diff --git a/params_shard_19.bin b/params_shard_19.bin new file mode 100644 index 0000000000000000000000000000000000000000..44e6f06d8423b22098480fde73855f2f1c9060e5 --- /dev/null +++ b/params_shard_19.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d834124b3230006aa78813d71cbcff11364da3c2f36009ce974917b98207214f +size 35389440 diff --git a/params_shard_2.bin b/params_shard_2.bin new file mode 100644 index 0000000000000000000000000000000000000000..3789d82edeebe09da51b0beeaaa30c72d2701ca2 --- /dev/null +++ b/params_shard_2.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e67a2372f9d43c7919f74ccd90a38196f929d19ba600fbe223f62a856a9d2a0 +size 70778880 diff --git a/params_shard_20.bin b/params_shard_20.bin new file mode 100644 index 0000000000000000000000000000000000000000..3c83800bbdb18fd28c18d3dff660271add56f035 --- /dev/null +++ b/params_shard_20.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f00233223c8981d1ca3638a0d8794e4140b6c9531e9f5a3272b99255030affae +size 39321600 diff --git a/params_shard_21.bin b/params_shard_21.bin new file mode 100644 index 0000000000000000000000000000000000000000..09ecf73b68c9e33f564538297b257fbd8053844d --- /dev/null +++ b/params_shard_21.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7677733eb909f04dfa14c5816a19fba03a3d684a0147f9379ca9f843d1e0ef51 +size 23040000 diff --git a/params_shard_22.bin b/params_shard_22.bin new file mode 100644 index 0000000000000000000000000000000000000000..c6844c356b511e8244acd1412556d7bacc9a4139 --- /dev/null +++ b/params_shard_22.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cac4c76bdf2cbae8c712673a026f84bba0cb95f29d69514efa3be1f4561eb38 +size 70778880 diff --git a/params_shard_23.bin b/params_shard_23.bin new file mode 100644 index 0000000000000000000000000000000000000000..0784635785e7c03df064eedbf359d17374a97c0d --- /dev/null +++ b/params_shard_23.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0ffdd3eee58ade1de60b7847ba0035f8deb2196b2d618be225f3c5daa71f5b4 +size 35389440 diff --git a/params_shard_24.bin b/params_shard_24.bin new file mode 100644 index 0000000000000000000000000000000000000000..17f85f337329bd814f5e52da722d5177c68629bf --- /dev/null +++ b/params_shard_24.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e93f7ccddbb7864dd26cdc529827c15cba20c0797ce43599c12dba39aaaa378 +size 39321600 diff --git a/params_shard_25.bin b/params_shard_25.bin new file mode 100644 index 0000000000000000000000000000000000000000..07a20c96610d99b241a55359c5cc657876c46947 --- /dev/null +++ b/params_shard_25.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c96dedd1a163136e8ffc747eb4efda16092fba8512e26b56b1cde0d1268fc34 +size 23040000 diff --git a/params_shard_26.bin b/params_shard_26.bin new file mode 100644 index 0000000000000000000000000000000000000000..2644a2205de42888591dc45749d2d018c4afd985 --- /dev/null +++ b/params_shard_26.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6dd54b318d8cb05459334dee41d369ce3b80757756e751a26cd83dc5d2b5d96d +size 70778880 diff --git a/params_shard_27.bin b/params_shard_27.bin new file mode 100644 index 0000000000000000000000000000000000000000..9f766a92c712686cfc884670a167d934ad01550e --- /dev/null +++ b/params_shard_27.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0867932f62268b65c731e1915a85017a1ed47f84729775372eaa2f8b2bada69 +size 35389440 diff --git a/params_shard_28.bin b/params_shard_28.bin new file mode 100644 index 0000000000000000000000000000000000000000..3db966026712ea7b2a22be41cca699319d68f9af --- /dev/null +++ b/params_shard_28.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ab5a15fd96f994ab97c6934c859c4328c1db9d990b9da7b90e2bd40877e3cfb +size 39321600 diff --git a/params_shard_29.bin b/params_shard_29.bin new file mode 100644 index 0000000000000000000000000000000000000000..86298e7331adc30631c9a9e8a2641b7d5ccb3623 --- /dev/null +++ b/params_shard_29.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81adf7c53998c17e4ab32c1a5295ae19aca02cb211430fcd08c4c099dcbea86f +size 23040000 diff --git a/params_shard_3.bin b/params_shard_3.bin new file mode 100644 index 0000000000000000000000000000000000000000..4be25187595baf166bf7ebfd6de0284076a3ad88 --- /dev/null +++ b/params_shard_3.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fad6f5feffa517b7e9ac8845306313594691a0757925a2662a0ad2eae7500b69 +size 35389440 diff --git a/params_shard_30.bin b/params_shard_30.bin new file mode 100644 index 0000000000000000000000000000000000000000..2415c4c0c3d9646aea114e287c34ffe1f16be89a --- /dev/null +++ b/params_shard_30.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56a6909ab770eb12b5c8882ee38f5867326c4493ce214c2efeade6b1fa8443af +size 70778880 diff --git a/params_shard_31.bin b/params_shard_31.bin new file mode 100644 index 0000000000000000000000000000000000000000..ee025d6c142688dbe2556873b336d4f4612aa5d5 --- /dev/null +++ b/params_shard_31.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a006da4f55390a5c054c34a8d3bee27eb7400007654efc56fcce2809825ef8b8 +size 35389440 diff --git a/params_shard_32.bin b/params_shard_32.bin new file mode 100644 index 0000000000000000000000000000000000000000..9bf0801c908545069209d5884678af1af0b658bd --- /dev/null +++ b/params_shard_32.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:507018b64fb6f1a886c1a6a62d0fffa94cabf9671ed885a0a722f1d4e80e247a +size 39321600 diff --git a/params_shard_33.bin b/params_shard_33.bin new file mode 100644 index 0000000000000000000000000000000000000000..945fd1b2d0b9d6852f0a083306bfb3e1a0d56e15 --- /dev/null +++ b/params_shard_33.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1292a9f91ac2146cd8974cf07375d2aa0601fa8b706acc11fe9462a073ff3a87 +size 23040000 diff --git a/params_shard_34.bin b/params_shard_34.bin new file mode 100644 index 0000000000000000000000000000000000000000..9dbbf73b95153a5af68fa68a3b6ab008578b3681 --- /dev/null +++ b/params_shard_34.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1206ed3165493a3879b121be78473075d3921d0c4201e78ae858d3c13b142b0 +size 70778880 diff --git a/params_shard_35.bin b/params_shard_35.bin new file mode 100644 index 0000000000000000000000000000000000000000..97e970f19afaf8cb4edd45b546482f01da86d495 --- /dev/null +++ b/params_shard_35.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84f7a272591ce28259c0dd201710abf770d9eb897d467b47ffc8665a2c1933ee +size 35389440 diff --git a/params_shard_36.bin b/params_shard_36.bin new file mode 100644 index 0000000000000000000000000000000000000000..ce9ab56b9d233dd8d41ad9bb025b343938ed9184 --- /dev/null +++ b/params_shard_36.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4311f33de70d147efbbe7250cc32cf821e4b1a761ac37847188fccacac391ebe +size 39321600 diff --git a/params_shard_37.bin b/params_shard_37.bin new file mode 100644 index 0000000000000000000000000000000000000000..c6172793e82a39493e9cb829075886e30ddb94e9 --- /dev/null +++ b/params_shard_37.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac03b6855a4322d1adf3752b1e7512977153204f5af896aff5435854a85381ec +size 23040000 diff --git a/params_shard_38.bin b/params_shard_38.bin new file mode 100644 index 0000000000000000000000000000000000000000..fa6affe1378e755c0856d5e244bdde411e9de353 --- /dev/null +++ b/params_shard_38.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:925a608a40072540ded2455878135645c970365be1a50c8d0ddbe9dfbbc5abb0 +size 70778880 diff --git a/params_shard_39.bin b/params_shard_39.bin new file mode 100644 index 0000000000000000000000000000000000000000..2e43c1d74217575abfa9c3b8351fb4ffeae74802 --- /dev/null +++ b/params_shard_39.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a8a258723030d0792c4d1a04e00d64c4fd3f10ef6bcac27f031608ce1faa1d7 +size 35389440 diff --git a/params_shard_4.bin b/params_shard_4.bin new file mode 100644 index 0000000000000000000000000000000000000000..94873674aa43d518f59692113f603109bd4a3826 --- /dev/null +++ b/params_shard_4.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afa9857bc29fd36cecb051c6c381d7ea130eff15c2b363d58710e62412ce1fdd +size 39321600 diff --git a/params_shard_40.bin b/params_shard_40.bin new file mode 100644 index 0000000000000000000000000000000000000000..1acad84a49b157413fe6e4dd3313e3a9c964f1ef --- /dev/null +++ b/params_shard_40.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44cf70a635e587a822482bc348ebe986d9fc426c089d583636fffb203b5cbef8 +size 39321600 diff --git a/params_shard_41.bin b/params_shard_41.bin new file mode 100644 index 0000000000000000000000000000000000000000..e70b17e396d6e2c50fc742780f4189e35ab491b9 --- /dev/null +++ b/params_shard_41.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6a585ccef4270ee32b4e8c8950c2f6912dfa3392f46b170e59a1d29f90feb32 +size 23040000 diff --git a/params_shard_42.bin b/params_shard_42.bin new file mode 100644 index 0000000000000000000000000000000000000000..de49bf5a897dc8063d7cb3e3b9dccaae4008293d --- /dev/null +++ b/params_shard_42.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66657378ecbd558563d98bdb241bd8d3a04f25113d8b422b5650f4b612ace79e +size 70778880 diff --git a/params_shard_43.bin b/params_shard_43.bin new file mode 100644 index 0000000000000000000000000000000000000000..4358f00be869e6103a2c0f8e956b4dabf622772d --- /dev/null +++ b/params_shard_43.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc2a452423bc68b4de669bed0396c142121da178a466b1be13842e0039abda45 +size 35389440 diff --git a/params_shard_44.bin b/params_shard_44.bin new file mode 100644 index 0000000000000000000000000000000000000000..bc1424cedfd586583c27aff0ce1ee400ef241869 --- /dev/null +++ b/params_shard_44.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a473943399ae5bd0671627a98d526654d039bb0b0e8a01fd4b21c34e11654828 +size 39321600 diff --git a/params_shard_45.bin b/params_shard_45.bin new file mode 100644 index 0000000000000000000000000000000000000000..d77175c28e9f647706066299811a3c26f9ae8934 --- /dev/null +++ b/params_shard_45.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cfa9e7f7f201867dff5ddf7fa99d0df5f0755cdbb3e841291ec6efed3f34ea5 +size 23040000 diff --git a/params_shard_46.bin b/params_shard_46.bin new file mode 100644 index 0000000000000000000000000000000000000000..058394973eea0596c15e36d6ee5183ab913c8cea --- /dev/null +++ b/params_shard_46.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ea87b0c9d9a7d5199564730cf8e71d2c2d6fbd5282504273952866ad2893c13 +size 70778880 diff --git a/params_shard_47.bin b/params_shard_47.bin new file mode 100644 index 0000000000000000000000000000000000000000..5f09cb82d763670a76eb33aa0d51cf41d06f1bb0 --- /dev/null +++ b/params_shard_47.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f9f303f7b030ffe2f0161da307e1ed30c8fb2f3d425fe4d80842ef6985ce019 +size 35389440 diff --git a/params_shard_48.bin b/params_shard_48.bin new file mode 100644 index 0000000000000000000000000000000000000000..b9bd7cb4ea171b1134f9c8154da7c803e8bbc45e --- /dev/null +++ b/params_shard_48.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86aedd5ff9ca106086f0b9da221230b3f952369f405470ccd97cc899eb912d36 +size 39321600 diff --git a/params_shard_49.bin b/params_shard_49.bin new file mode 100644 index 0000000000000000000000000000000000000000..215e3a72390d840007cafabf898329ee6f9447dd --- /dev/null +++ b/params_shard_49.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c00dc634a3ade9e5556a6f9545ccea70b61d71ffefd5978f9a4da170d8669ef9 +size 23040000 diff --git a/params_shard_5.bin b/params_shard_5.bin new file mode 100644 index 0000000000000000000000000000000000000000..0922a87c1431da6921a28c34b4544cbe08f0a70c --- /dev/null +++ b/params_shard_5.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8f6583d18275494efae7fd8240410ff9a9bfab2af31bc990eca1a13366addf3 +size 25497600 diff --git a/params_shard_50.bin b/params_shard_50.bin new file mode 100644 index 0000000000000000000000000000000000000000..14b7b4ff73cafa8258a12eb74ac35d669dee1bff --- /dev/null +++ b/params_shard_50.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6255635ff441ceeb9c175315e9a595b03983e5c0ae8aaf774b2f353e0908110 +size 70778880 diff --git a/params_shard_51.bin b/params_shard_51.bin new file mode 100644 index 0000000000000000000000000000000000000000..bba0b3df83f8e90c966dfaee3291146e636ded54 --- /dev/null +++ b/params_shard_51.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84930599b03d746a523761ad3fd565635c7c79fa7b8a5ee4d494f6487bfce791 +size 35389440 diff --git a/params_shard_52.bin b/params_shard_52.bin new file mode 100644 index 0000000000000000000000000000000000000000..54ff590170bae7ab44d8add0dd259132f16834e2 --- /dev/null +++ b/params_shard_52.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86a8829674daae75f1aecf3de9dbf8ed36c2a287c899f5772ec60405a2e0522f +size 39321600 diff --git a/params_shard_53.bin b/params_shard_53.bin new file mode 100644 index 0000000000000000000000000000000000000000..ec46a0c74c5497e26a6274281937935dd5eff464 --- /dev/null +++ b/params_shard_53.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2efb846fb0e9052395a03c03cc6955891e9152d2739533206219f43d5e77a4c +size 23040000 diff --git a/params_shard_54.bin b/params_shard_54.bin new file mode 100644 index 0000000000000000000000000000000000000000..abd161b2b1145b979b0930d2c652195dbedafbfc --- /dev/null +++ b/params_shard_54.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ca89fef2b8590e38acda8a6b5e5adef4b0c1983e8b4b451dec337699cd5d412 +size 70778880 diff --git a/params_shard_55.bin b/params_shard_55.bin new file mode 100644 index 0000000000000000000000000000000000000000..dc60fa513540c69a66fee5f67e2e683351a89b2f --- /dev/null +++ b/params_shard_55.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7306cbf93842b1ff23cae945970dbb2b6ab24e8f8367ab376edd3689c530bbb +size 35389440 diff --git a/params_shard_56.bin b/params_shard_56.bin new file mode 100644 index 0000000000000000000000000000000000000000..acc2bad52bd362f205a90ba5f34d4e64a1731e38 --- /dev/null +++ b/params_shard_56.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f05a95b556b61dd88d927c89bcbd05de1e6e3b002996ebff92fa76e5fb7c920c +size 39321600 diff --git a/params_shard_57.bin b/params_shard_57.bin new file mode 100644 index 0000000000000000000000000000000000000000..48d8c5adfa5ba329b6c342a4c0fb7e6599664507 --- /dev/null +++ b/params_shard_57.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f07754fda0dadafb97eab0288b4a1f81aaf57f4d027ed1596200ae34d9b194f +size 23040000 diff --git a/params_shard_58.bin b/params_shard_58.bin new file mode 100644 index 0000000000000000000000000000000000000000..fa1536870fe21f5f608625b6e97354cd8af1b4d4 --- /dev/null +++ b/params_shard_58.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e33e649c4d5706c0e71f8f169907fbe9741644ed91135aa40497e9d678a08fae +size 70778880 diff --git a/params_shard_59.bin b/params_shard_59.bin new file mode 100644 index 0000000000000000000000000000000000000000..e6ba22f7a0bd9674d17210cfe4435d30f636760d --- /dev/null +++ b/params_shard_59.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9774891f33b3833e3785b75f71644d442cf48e6b5346c9d329f4799b59c9bf95 +size 35389440 diff --git a/params_shard_6.bin b/params_shard_6.bin new file mode 100644 index 0000000000000000000000000000000000000000..c00239b3466ad91b446dafc79b5f6a806e8754f1 --- /dev/null +++ b/params_shard_6.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a515bd9168c448d003ac05deb2a66ad75a1bb8a323974d35169d17b8b1f5ed76 +size 70778880 diff --git a/params_shard_60.bin b/params_shard_60.bin new file mode 100644 index 0000000000000000000000000000000000000000..4e8283669927c85a4e17bb8278af33795d585501 --- /dev/null +++ b/params_shard_60.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4d06da12bff3c53fe6419fdfdcc077cfc0863acd12e96c1b3cd7effca599b01 +size 39321600 diff --git a/params_shard_61.bin b/params_shard_61.bin new file mode 100644 index 0000000000000000000000000000000000000000..ed62b230a6407748fe7be3f1f80ea33e630bc749 --- /dev/null +++ b/params_shard_61.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f6c05075c721580b40e22a2047694b3ed18cab3a6633716553bc86e2338a5c0 +size 23040000 diff --git a/params_shard_62.bin b/params_shard_62.bin new file mode 100644 index 0000000000000000000000000000000000000000..c73fdc9fbe50d4de8e69682a44cccd2f98e7b8c2 --- /dev/null +++ b/params_shard_62.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c4ed71ae88b242ae1cb28729c86ec41eb1d88c586e67194ebf581b4be798f57 +size 70778880 diff --git a/params_shard_63.bin b/params_shard_63.bin new file mode 100644 index 0000000000000000000000000000000000000000..51d9d5b281fc59371ed22cf49c8f0fc9c17d2462 --- /dev/null +++ b/params_shard_63.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cc91eacbe10f43dffcc1ed6a6004925e398594c80a08d1eec380157298dea6a +size 35389440 diff --git a/params_shard_64.bin b/params_shard_64.bin new file mode 100644 index 0000000000000000000000000000000000000000..e422143f311ec933b02a2ea0e83b22c3902c44ce --- /dev/null +++ b/params_shard_64.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22a5b4840969a2ace7ddf35ecf3de082174add13510a25df08486c6a503bd9aa +size 39321600 diff --git a/params_shard_65.bin b/params_shard_65.bin new file mode 100644 index 0000000000000000000000000000000000000000..56326e50014304a97fee8793eb11b70987be9563 --- /dev/null +++ b/params_shard_65.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f02f9d2f97d404719f985f22705c53340d0c8c852a4d0803cef9a4622d77e85 +size 23040000 diff --git a/params_shard_66.bin b/params_shard_66.bin new file mode 100644 index 0000000000000000000000000000000000000000..d766f1ed9efd24edee40226f2ae69444797f30d0 --- /dev/null +++ b/params_shard_66.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e85c22664b898bf353a534b84bebce3a02df8c8d30ba8e55d590bef986b436f9 +size 70778880 diff --git a/params_shard_67.bin b/params_shard_67.bin new file mode 100644 index 0000000000000000000000000000000000000000..03db72b02b0744aed27577f5eaa2819b8e27051c --- /dev/null +++ b/params_shard_67.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f00d58c2d55aa8331c6a10734bb158d01d764fc52a0e115ca726688cc73eeb69 +size 35389440 diff --git a/params_shard_68.bin b/params_shard_68.bin new file mode 100644 index 0000000000000000000000000000000000000000..6ccc745e65200e16aa84edb3094b616bbc4f8c69 --- /dev/null +++ b/params_shard_68.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b84c131b28c6e3723be27905fea76db0f39fe0fd32cbe61225ccb0dcab33b401 +size 39321600 diff --git a/params_shard_69.bin b/params_shard_69.bin new file mode 100644 index 0000000000000000000000000000000000000000..a963b5be20766dfddb49cf9ffe4ed5a65162384d --- /dev/null +++ b/params_shard_69.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:680ce8b3f823d7f70b7cd5a750bcb90944be6ca354cf4fba0ca9722b6bfccd13 +size 23040000 diff --git a/params_shard_7.bin b/params_shard_7.bin new file mode 100644 index 0000000000000000000000000000000000000000..51e0761af58954ae8db5c74d17c348dc92af20fc --- /dev/null +++ b/params_shard_7.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c8911e6386bb60d6b5472da458c122639d4dcf69ce1815b2871e741caabbc43 +size 35389440 diff --git a/params_shard_70.bin b/params_shard_70.bin new file mode 100644 index 0000000000000000000000000000000000000000..ac2465cc99be78ae7b39574b6abe245748cf9bd3 --- /dev/null +++ b/params_shard_70.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:080da6f2992a26df17f2d8ca4ec8f18ce5a5e46e493691ff4eeb1f8f1515cef3 +size 70778880 diff --git a/params_shard_71.bin b/params_shard_71.bin new file mode 100644 index 0000000000000000000000000000000000000000..babb6e1bf617319ef9284092b0bdd92a0274db89 --- /dev/null +++ b/params_shard_71.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09a3e63feaf27323f85445fdb98b1392c22afd428e3bd8cb4a394668d37ec43b +size 35389440 diff --git a/params_shard_72.bin b/params_shard_72.bin new file mode 100644 index 0000000000000000000000000000000000000000..da0cc80a3dc78b805ee47bc0cabad2a40f7ab0c0 --- /dev/null +++ b/params_shard_72.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5fca2356a37ba1d7306bee098585a87e645dbf38d55dbc695725d60d11e7452 +size 39321600 diff --git a/params_shard_73.bin b/params_shard_73.bin new file mode 100644 index 0000000000000000000000000000000000000000..9c9e62935e7e9c7deccfcfe4ff94e8e9fa0dcfd1 --- /dev/null +++ b/params_shard_73.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2739c5f5d92ac54601d8c2f9553ce8bdd37641060b0819cdaf5f1e0648ead04 +size 23040000 diff --git a/params_shard_74.bin b/params_shard_74.bin new file mode 100644 index 0000000000000000000000000000000000000000..774022ece8ac269b1f8eaff4ebcd0fa4d12f24d7 --- /dev/null +++ b/params_shard_74.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84cc437b610a19d83e976a5645ddb334d07f990c133d52a90b5f6ab46eb18186 +size 70778880 diff --git a/params_shard_75.bin b/params_shard_75.bin new file mode 100644 index 0000000000000000000000000000000000000000..03cade45f1b68e50fc0a78e11a2fc0a34d1f97c9 --- /dev/null +++ b/params_shard_75.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:109f548243d2f960e9fce8c5aa8e2acca3c7fdfcd7e84a4c9f7de97280d63349 +size 35389440 diff --git a/params_shard_76.bin b/params_shard_76.bin new file mode 100644 index 0000000000000000000000000000000000000000..fa9e53bf6263e8dd8669634e934eeaa00d888a16 --- /dev/null +++ b/params_shard_76.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9de7baec751497d67dfd4f80bea1ca948a8d64521b4e49b4d4f2afb9f680379 +size 39321600 diff --git a/params_shard_77.bin b/params_shard_77.bin new file mode 100644 index 0000000000000000000000000000000000000000..75e372a0dfccf5cb78bebb649a8e60bc25a7342b --- /dev/null +++ b/params_shard_77.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29e457f6beed42d9d2a094cbbfeaf2b705c6eb69ef811ec13f3a0d63c2ea0afc +size 23040000 diff --git a/params_shard_78.bin b/params_shard_78.bin new file mode 100644 index 0000000000000000000000000000000000000000..69c5696b154dfb7963de54a492ee4587f44c1320 --- /dev/null +++ b/params_shard_78.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65f939200b6490c6ef5ca0b19b62ae88f08a92e0b99c29fee2e2f64d3f1894d7 +size 70778880 diff --git a/params_shard_79.bin b/params_shard_79.bin new file mode 100644 index 0000000000000000000000000000000000000000..6532a98d67964bf0b110cb86dd48bf96e303b6a7 --- /dev/null +++ b/params_shard_79.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96cb65710d056a2211be6d16b803438616712e905cd193eb006a1bf4924b59d3 +size 35389440 diff --git a/params_shard_8.bin b/params_shard_8.bin new file mode 100644 index 0000000000000000000000000000000000000000..2c0f49309338dbe853a2e0b5da3f2855ca5f1244 --- /dev/null +++ b/params_shard_8.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:910cf2872ad505ad56c5f1ccf59bf922f0222f9999df3eb26f280a13dc6d47cd +size 39321600 diff --git a/params_shard_80.bin b/params_shard_80.bin new file mode 100644 index 0000000000000000000000000000000000000000..68e8c951649174a174904d43ad2a68d129942179 --- /dev/null +++ b/params_shard_80.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85b5fe09b93bde1432ed87074fd3cb7552d66ee40015d14e86dc24f52842c7a2 +size 39321600 diff --git a/params_shard_81.bin b/params_shard_81.bin new file mode 100644 index 0000000000000000000000000000000000000000..6436ff0a3e3ca157a1c4ddce02c87ed9bbb0e0f0 --- /dev/null +++ b/params_shard_81.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7b08d8b21e15e575a0a35cb55c485848995bdc4d86e91bf79f421219fec5352 +size 23040000 diff --git a/params_shard_82.bin b/params_shard_82.bin new file mode 100644 index 0000000000000000000000000000000000000000..6ca7aaacb4681ae744f6a659a28585ca6143fee0 --- /dev/null +++ b/params_shard_82.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2a90de2e79da323f71fc257c90963a2d404a67f9cea1c9490b6b3b6ae9a8c2e +size 70778880 diff --git a/params_shard_83.bin b/params_shard_83.bin new file mode 100644 index 0000000000000000000000000000000000000000..c896af06e2189552f9741d787ad09a4b5e6433c7 --- /dev/null +++ b/params_shard_83.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ec58c9a3aa71813d58a59f483458e70211da2007ffddda547786ee6f434ab5d +size 35389440 diff --git a/params_shard_84.bin b/params_shard_84.bin new file mode 100644 index 0000000000000000000000000000000000000000..310c08e5bd31a014a3b0a9fe6103feceb5c05a54 --- /dev/null +++ b/params_shard_84.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5632dd0fc1b3bb0c1ef86c6e7c9baf87313bd4e38f2af60df095f1bbfb3f839 +size 39321600 diff --git a/params_shard_85.bin b/params_shard_85.bin new file mode 100644 index 0000000000000000000000000000000000000000..608f3c921b4f8d154d7ddd4bc3d6c7b56e9d9137 --- /dev/null +++ b/params_shard_85.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7277656d9319902963802e7cccba95a00c43a355c65495ca0a588256b557a7e6 +size 23040000 diff --git a/params_shard_86.bin b/params_shard_86.bin new file mode 100644 index 0000000000000000000000000000000000000000..c61c42212d5c89a72b21212956ad66232b0b77f6 --- /dev/null +++ b/params_shard_86.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20bd0d32454a55dfb05ef6b3182cf5ca8c8d5817a42ff91bd044fd5b4bc6c0ca +size 70778880 diff --git a/params_shard_87.bin b/params_shard_87.bin new file mode 100644 index 0000000000000000000000000000000000000000..99ba11872f6f77631d789f4d1e110da0e980978d --- /dev/null +++ b/params_shard_87.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9faa3e4ec07b09842f41c503c6417be7c695bbca49f63cf7bac54fcdd7da15f2 +size 35389440 diff --git a/params_shard_88.bin b/params_shard_88.bin new file mode 100644 index 0000000000000000000000000000000000000000..e46d427dc424664ae72804b5880e1fd6ccb72eb1 --- /dev/null +++ b/params_shard_88.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:408acce958c7911405372fcdb956d16910bb9234e7968c0c8d121ebdcc7259b0 +size 39321600 diff --git a/params_shard_89.bin b/params_shard_89.bin new file mode 100644 index 0000000000000000000000000000000000000000..1dc364a74c093b0700402065ca54e3c1fdcb1e08 --- /dev/null +++ b/params_shard_89.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98706e9168da26770b7691b3ead02384b857f375989ab32dae761b93686a7427 +size 23040000 diff --git a/params_shard_9.bin b/params_shard_9.bin new file mode 100644 index 0000000000000000000000000000000000000000..b557202cbe5a4bbd10ebf3bf9cfe621244544863 --- /dev/null +++ b/params_shard_9.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:378ce9dd7c73defe0608fdbe512a498c3bac99ff7965bb1161d6c3759c1057f5 +size 23040000 diff --git a/params_shard_90.bin b/params_shard_90.bin new file mode 100644 index 0000000000000000000000000000000000000000..4705d5145fab55894fec28c93e17ee6932479152 --- /dev/null +++ b/params_shard_90.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:507f85b760ccb707a283137b580f996983eaf5554a0bf7c39c5e05bfc21d3dd5 +size 70778880 diff --git a/params_shard_91.bin b/params_shard_91.bin new file mode 100644 index 0000000000000000000000000000000000000000..a549763bb6d84562ee2df6d2a797acbec94b0266 --- /dev/null +++ b/params_shard_91.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7f7b0f20d2167a735dce7c9c59994731305ec0ff2c93d26153ad198d851ce42 +size 35389440 diff --git a/params_shard_92.bin b/params_shard_92.bin new file mode 100644 index 0000000000000000000000000000000000000000..34b19f7b6a5bbc0a10f7dcdbc6213b98e5e61bca --- /dev/null +++ b/params_shard_92.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45b6e7f3e2f3e1ff16c90e62be5dc7943d14078e25a8b1a48c4f3323f1c9338a +size 39321600 diff --git a/params_shard_93.bin b/params_shard_93.bin new file mode 100644 index 0000000000000000000000000000000000000000..467864eddd2c04677d89dcdc0e67bc4e93e75a55 --- /dev/null +++ b/params_shard_93.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58dd909f0b73dc0fabc155df87754e553a00d5e6ad8b91ed47a5d637dade81f1 +size 23040000 diff --git a/params_shard_94.bin b/params_shard_94.bin new file mode 100644 index 0000000000000000000000000000000000000000..3af6c196fc544de69e2148afe3a8f40756e04e8a --- /dev/null +++ b/params_shard_94.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e9fb3ea4ce0c50f54bb1db12cf664f27834f327d177e0b0491e3c4c9d9c6f29 +size 70778880 diff --git a/params_shard_95.bin b/params_shard_95.bin new file mode 100644 index 0000000000000000000000000000000000000000..b51cfdad34f0f4ee093c200170e87b297428ecbd --- /dev/null +++ b/params_shard_95.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40746cdcbe9dc3c82b8608a7eeaf71743fb3f0acb949aba639702cae5c82f6f7 +size 35389440 diff --git a/params_shard_96.bin b/params_shard_96.bin new file mode 100644 index 0000000000000000000000000000000000000000..0eecbde23520d5933c44a9e4062e28cdae481ff5 --- /dev/null +++ b/params_shard_96.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edbf55e9c37e3f436160c93b02c6b6b52cacb2c86d6b167b8beda21633e337da +size 39321600 diff --git a/params_shard_97.bin b/params_shard_97.bin new file mode 100644 index 0000000000000000000000000000000000000000..b90c4cf3f186c6f2da5b1583d3576ace205cae3c --- /dev/null +++ b/params_shard_97.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76e73ebb52ab9e6b20cc2f2817e4109fbd1eb29f3e72a27bca0d4d53b9a4cb04 +size 23040000 diff --git a/params_shard_98.bin b/params_shard_98.bin new file mode 100644 index 0000000000000000000000000000000000000000..efa35fa3db3fb508ebcf799aab5efea0c5249489 --- /dev/null +++ b/params_shard_98.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63613941e3aba51fa960db0f1642c6eaabbd57caf37ee0667b8d719fbb2e7d15 +size 70778880 diff --git a/params_shard_99.bin b/params_shard_99.bin new file mode 100644 index 0000000000000000000000000000000000000000..d7b1171061fee063e70ffbe9f9f9fdb77988481e --- /dev/null +++ b/params_shard_99.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b69c8c9334af3f2941bce89b379b2019474d9bae65edcd894efb7f56e601445 +size 35389440 diff --git a/private-llm-config.json b/private-llm-config.json new file mode 100644 index 0000000000000000000000000000000000000000..75e3a6ec8e12a298019d83756126a45087f7e709 --- /dev/null +++ b/private-llm-config.json @@ -0,0 +1,20 @@ +{ + "model_lib": "MythoMax-L2-13b-w4a16g128asym", + "local_id": "MythoMax-L2-13b-w4a16g128asym", + "conv_template": "llama_default", + "temperature": 0.7, + "repetition_penalty": 1.1, + "top_p": 0.95, + "mean_gen_len": 512, + "max_gen_len": 2048, + "max_window_size": 3072, + "num_shards": 1, + "shift_fill_factor": 0.3, + "tokenizer_files": [ + "added_tokens.json", + "tokenizer.model" + ], + "model_category": "llama", + "model_name": "MythoMax-L2-13b", + "vocab_size": 32000 +} diff --git a/tokenizer.model b/tokenizer.model new file mode 100644 index 0000000000000000000000000000000000000000..6c00c742ce03c627d6cd5b795984876fa49fa899 --- /dev/null +++ b/tokenizer.model @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e556afd44213b6bd1be2b850ebbbd98f5481437a8021afaf58ee7fb1818d347 +size 499723 diff --git a/tokenizer_config.json b/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..542a9fc8ddb435681466bc3cb708a735f04f5235 --- /dev/null +++ b/tokenizer_config.json @@ -0,0 +1,37 @@ +{ + "add_bos_token": true, + "add_eos_token": false, + "bos_token": { + "__type": "AddedToken", + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + }, + "clean_up_tokenization_spaces": false, + "eos_token": { + "__type": "AddedToken", + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + }, + "legacy": false, + "model_max_length": 4096, + "pad_token": null, + "padding_side": "right", + "sp_model_kwargs": {}, + "spaces_between_special_tokens": false, + "tokenizer_class": "LlamaTokenizer", + "unk_token": { + "__type": "AddedToken", + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + }, + "use_default_system_prompt": true +}