diff --git a/.gitattributes b/.gitattributes index a6344aac8c09253b3b630fb776ae94478aa0275b..52b264d3f421335397ffaf36aba6ee4d3a211b59 100644 --- a/.gitattributes +++ b/.gitattributes @@ -33,3 +33,6 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text *.zip filter=lfs diff=lfs merge=lfs -text *.zst filter=lfs diff=lfs merge=lfs -text *tfevents* filter=lfs diff=lfs merge=lfs -text +*.so filter=lfs diff=lfs merge=lfs -text +*.dll filter=lfs diff=lfs merge=lfs -text +*.lib filter=lfs diff=lfs merge=lfs -text diff --git a/MiniChat-1.5-3B-q4f16_1-vulkan.dll b/MiniChat-1.5-3B-q4f16_1-vulkan.dll new file mode 100644 index 0000000000000000000000000000000000000000..a3a97889aa61c7c5fbfcbef22568f1852007af60 --- /dev/null +++ b/MiniChat-1.5-3B-q4f16_1-vulkan.dll @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be81332f4249e7fcc4fff237d988064112d77280f06a6ced02a35232c932d90c +size 26675712 diff --git a/MiniChat-1.5-3B-q4f16_1-vulkan.exp b/MiniChat-1.5-3B-q4f16_1-vulkan.exp new file mode 100644 index 0000000000000000000000000000000000000000..392890074d066c4e2feeb6903b4edfee5990ae35 Binary files /dev/null and b/MiniChat-1.5-3B-q4f16_1-vulkan.exp differ diff --git a/MiniChat-1.5-3B-q4f16_1-vulkan.lib b/MiniChat-1.5-3B-q4f16_1-vulkan.lib new file mode 100644 index 0000000000000000000000000000000000000000..f9b1d3fd98070b0a88d67a87d240e67dfafab7c1 --- /dev/null +++ b/MiniChat-1.5-3B-q4f16_1-vulkan.lib @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ea706f1d92d34e752c22794cde07923436f6c807ac8cd1bdb0136d44b842245 +size 14110 diff --git a/params/mlc-chat-config.json b/params/mlc-chat-config.json new file mode 100644 index 0000000000000000000000000000000000000000..777f3d51ab87c37311b4a4e2401990167dd6e2f6 --- /dev/null +++ b/params/mlc-chat-config.json @@ -0,0 +1,21 @@ +{ + "model_lib": "MiniChat-1.5-3B-q4f16_1", + "local_id": "MiniChat-1.5-3B-q4f16_1", + "conv_template": "llama_default", + "temperature": 0.7, + "repetition_penalty": 1.0, + "top_p": 0.95, + "mean_gen_len": 128, + "max_gen_len": 4096, + "num_shards": 1, + "use_presharded_weights": false, + "shift_fill_factor": 0.3, + "tokenizer_files": [ + "tokenizer.model" + ], + "model_category": "llama", + "model_name": "MiniChat-1.5-3B", + "vocab_size": 49216, + "prefill_chunk_size": -1, + "max_window_size": 4096 +} \ No newline at end of file diff --git a/params/ndarray-cache.json b/params/ndarray-cache.json new file mode 100644 index 0000000000000000000000000000000000000000..9cbbb52f11a941661db7f9fd6994e280ed54a111 --- /dev/null +++ b/params/ndarray-cache.json @@ -0,0 +1,3083 @@ +{ + "metadata": { + "ParamSize": 247 + }, + "records": [ + { + "dataPath": "params_shard_0.bin", + "format": "raw-shard", + "nbytes": 75595776, + "records": [ + { + "name": "param_0", + "shape": [ + 49216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 75595776, + "byteOffset": 0 + } + ], + "md5sum": "ecf15d3f0901ab7456e8e0af8ced507c" + }, + { + "dataPath": "params_shard_1.bin", + "format": "raw-shard", + "nbytes": 25165824, + "records": [ + { + "name": "param_6", + "shape": [ + 16384, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 0 + } + ], + "md5sum": "9bbebd6e9fb88198483ac084144d55a6" + }, + { + "dataPath": "params_shard_2.bin", + "format": "raw-shard", + "nbytes": 30683136, + "records": [ + { + "name": "param_1", + "shape": [ + 49216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 9449472, + "byteOffset": 0 + }, + { + "name": "param_2", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 9449472 + }, + { + "name": "param_3", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 23605248 + }, + { + "name": "param_4", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 25374720 + }, + { + "name": "param_5", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 30093312 + } + ], + "md5sum": "2e5970708026d9b687364767425202cb" + }, + { + "dataPath": "params_shard_3.bin", + "format": "raw-shard", + "nbytes": 33239040, + "records": [ + { + "name": "param_7", + "shape": [ + 16384, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 0 + }, + { + "name": "param_8", + "shape": [ + 3072, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 3145728 + }, + { + "name": "param_9", + "shape": [ + 3072, + 256 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 15728640 + }, + { + "name": "param_10", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 17301504 + }, + { + "name": "param_11", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 17307648 + }, + { + "name": "param_12", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 17313792 + }, + { + "name": "param_13", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 31469568 + } + ], + "md5sum": "9f934199d76c5d26646f3d545ab72fff" + }, + { + "dataPath": "params_shard_4.bin", + "format": "raw-shard", + "nbytes": 30474240, + "records": [ + { + "name": "param_14", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 0 + }, + { + "name": "param_15", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 4718592 + }, + { + "name": "param_16", + "shape": [ + 16384, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 5308416 + } + ], + "md5sum": "a3cb6df79e4429abc2be010fedfc51d1" + }, + { + "dataPath": "params_shard_5.bin", + "format": "raw-shard", + "nbytes": 33239040, + "records": [ + { + "name": "param_17", + "shape": [ + 16384, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 0 + }, + { + "name": "param_18", + "shape": [ + 3072, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 3145728 + }, + { + "name": "param_19", + "shape": [ + 3072, + 256 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 15728640 + }, + { + "name": "param_20", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 17301504 + }, + { + "name": "param_21", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 17307648 + }, + { + "name": "param_22", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 17313792 + }, + { + "name": "param_23", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 31469568 + } + ], + "md5sum": "abf83c3c7e851bb5767f197da8cb1dac" + }, + { + "dataPath": "params_shard_6.bin", + "format": "raw-shard", + "nbytes": 30474240, + "records": [ + { + "name": "param_24", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 0 + }, + { + "name": "param_25", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 4718592 + }, + { + "name": "param_26", + "shape": [ + 16384, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 5308416 + } + ], + "md5sum": "6ce898064ed0861322bbf62e9d70d729" + }, + { + "dataPath": "params_shard_7.bin", + "format": "raw-shard", + "nbytes": 33239040, + "records": [ + { + "name": "param_27", + "shape": [ + 16384, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 0 + }, + { + "name": "param_28", + "shape": [ + 3072, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 3145728 + }, + { + "name": "param_29", + "shape": [ + 3072, + 256 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 15728640 + }, + { + "name": "param_30", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 17301504 + }, + { + "name": "param_31", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 17307648 + }, + { + "name": "param_32", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 17313792 + }, + { + "name": "param_33", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 31469568 + } + ], + "md5sum": "172bd66af74d0e34491ae5bb801be91a" + }, + { + "dataPath": "params_shard_8.bin", + "format": "raw-shard", + "nbytes": 30474240, + "records": [ + { + "name": "param_34", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 0 + }, + { + "name": "param_35", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 4718592 + }, + { + "name": "param_36", + "shape": [ + 16384, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 5308416 + } + ], + "md5sum": "80622e63178dc3e00ced75b53b23fd35" + }, + { + "dataPath": "params_shard_9.bin", + "format": "raw-shard", + "nbytes": 33239040, + "records": [ + { + "name": "param_37", + "shape": [ + 16384, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 0 + }, + { + "name": "param_38", + "shape": [ + 3072, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 3145728 + }, + { + "name": "param_39", + "shape": [ + 3072, + 256 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 15728640 + }, + { + "name": "param_40", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 17301504 + }, + { + "name": "param_41", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 17307648 + }, + { + "name": "param_42", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 17313792 + }, + { + "name": "param_43", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 31469568 + } + ], + "md5sum": "1b105ec9d866d775cb69379c40757f88" + }, + { + "dataPath": "params_shard_10.bin", + "format": "raw-shard", + "nbytes": 30474240, + "records": [ + { + "name": "param_44", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 0 + }, + { + "name": "param_45", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 4718592 + }, + { + "name": "param_46", + "shape": [ + 16384, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 5308416 + } + ], + "md5sum": "8ca5fd22e33b7ecfc4edb22c2429bea0" + }, + { + "dataPath": "params_shard_11.bin", + "format": "raw-shard", + "nbytes": 33239040, + "records": [ + { + "name": "param_47", + "shape": [ + 16384, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 0 + }, + { + "name": "param_48", + "shape": [ + 3072, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 3145728 + }, + { + "name": "param_49", + "shape": [ + 3072, + 256 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 15728640 + }, + { + "name": "param_50", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 17301504 + }, + { + "name": "param_51", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 17307648 + }, + { + "name": "param_52", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 17313792 + }, + { + "name": "param_53", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 31469568 + } + ], + "md5sum": "33dbf522d5e71a2c9c80bba1cd630861" + }, + { + "dataPath": "params_shard_12.bin", + "format": "raw-shard", + "nbytes": 30474240, + "records": [ + { + "name": "param_54", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 0 + }, + { + "name": "param_55", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 4718592 + }, + { + "name": "param_56", + "shape": [ + 16384, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 5308416 + } + ], + "md5sum": "ffc57c8bae42beb9ca8bd2f58a9e4b90" + }, + { + "dataPath": "params_shard_13.bin", + "format": "raw-shard", + "nbytes": 33239040, + "records": [ + { + "name": "param_57", + "shape": [ + 16384, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 0 + }, + { + "name": "param_58", + "shape": [ + 3072, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 3145728 + }, + { + "name": "param_59", + "shape": [ + 3072, + 256 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 15728640 + }, + { + "name": "param_60", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 17301504 + }, + { + "name": "param_61", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 17307648 + }, + { + "name": "param_62", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 17313792 + }, + { + "name": "param_63", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 31469568 + } + ], + "md5sum": "7000c9ae4c55bccc6d8d4ff1cbfd6543" + }, + { + "dataPath": "params_shard_14.bin", + "format": "raw-shard", + "nbytes": 30474240, + "records": [ + { + "name": "param_64", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 0 + }, + { + "name": "param_65", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 4718592 + }, + { + "name": "param_66", + "shape": [ + 16384, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 5308416 + } + ], + "md5sum": "948f3bbf1c76842dde7f1b9831212144" + }, + { + "dataPath": "params_shard_15.bin", + "format": "raw-shard", + "nbytes": 33239040, + "records": [ + { + "name": "param_67", + "shape": [ + 16384, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 0 + }, + { + "name": "param_68", + "shape": [ + 3072, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 3145728 + }, + { + "name": "param_69", + "shape": [ + 3072, + 256 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 15728640 + }, + { + "name": "param_70", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 17301504 + }, + { + "name": "param_71", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 17307648 + }, + { + "name": "param_72", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 17313792 + }, + { + "name": "param_73", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 31469568 + } + ], + "md5sum": "32bec1a6997ffbfd0ab9e93f56b9ad87" + }, + { + "dataPath": "params_shard_16.bin", + "format": "raw-shard", + "nbytes": 30474240, + "records": [ + { + "name": "param_74", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 0 + }, + { + "name": "param_75", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 4718592 + }, + { + "name": "param_76", + "shape": [ + 16384, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 5308416 + } + ], + "md5sum": "8711c6302582fddaa4c9e7ed91a75c7b" + }, + { + "dataPath": "params_shard_17.bin", + "format": "raw-shard", + "nbytes": 33239040, + "records": [ + { + "name": "param_77", + "shape": [ + 16384, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 0 + }, + { + "name": "param_78", + "shape": [ + 3072, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 3145728 + }, + { + "name": "param_79", + "shape": [ + 3072, + 256 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 15728640 + }, + { + "name": "param_80", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 17301504 + }, + { + "name": "param_81", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 17307648 + }, + { + "name": "param_82", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 17313792 + }, + { + "name": "param_83", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 31469568 + } + ], + "md5sum": "29147a956d8177b8d4b5c57754a7d670" + }, + { + "dataPath": "params_shard_18.bin", + "format": "raw-shard", + "nbytes": 30474240, + "records": [ + { + "name": "param_84", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 0 + }, + { + "name": "param_85", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 4718592 + }, + { + "name": "param_86", + "shape": [ + 16384, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 5308416 + } + ], + "md5sum": "1471ebee434c1147a18f440f09f98e91" + }, + { + "dataPath": "params_shard_19.bin", + "format": "raw-shard", + "nbytes": 33239040, + "records": [ + { + "name": "param_87", + "shape": [ + 16384, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 0 + }, + { + "name": "param_88", + "shape": [ + 3072, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 3145728 + }, + { + "name": "param_89", + "shape": [ + 3072, + 256 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 15728640 + }, + { + "name": "param_90", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 17301504 + }, + { + "name": "param_91", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 17307648 + }, + { + "name": "param_92", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 17313792 + }, + { + "name": "param_93", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 31469568 + } + ], + "md5sum": "0e32a9c897b51680f461e8b1008f5701" + }, + { + "dataPath": "params_shard_20.bin", + "format": "raw-shard", + "nbytes": 30474240, + "records": [ + { + "name": "param_94", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 0 + }, + { + "name": "param_95", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 4718592 + }, + { + "name": "param_96", + "shape": [ + 16384, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 5308416 + } + ], + "md5sum": "e26e42c69c260b3bb2ab55694b1482fa" + }, + { + "dataPath": "params_shard_21.bin", + "format": "raw-shard", + "nbytes": 33239040, + "records": [ + { + "name": "param_97", + "shape": [ + 16384, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 0 + }, + { + "name": "param_98", + "shape": [ + 3072, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 3145728 + }, + { + "name": "param_99", + "shape": [ + 3072, + 256 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 15728640 + }, + { + "name": "param_100", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 17301504 + }, + { + "name": "param_101", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 17307648 + }, + { + "name": "param_102", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 17313792 + }, + { + "name": "param_103", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 31469568 + } + ], + "md5sum": "ae647c3f3d6a097e5470cf69248d3a63" + }, + { + "dataPath": "params_shard_22.bin", + "format": "raw-shard", + "nbytes": 30474240, + "records": [ + { + "name": "param_104", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 0 + }, + { + "name": "param_105", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 4718592 + }, + { + "name": "param_106", + "shape": [ + 16384, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 5308416 + } + ], + "md5sum": "871acb8160143ca04a5347cc79ec7885" + }, + { + "dataPath": "params_shard_23.bin", + "format": "raw-shard", + "nbytes": 33239040, + "records": [ + { + "name": "param_107", + "shape": [ + 16384, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 0 + }, + { + "name": "param_108", + "shape": [ + 3072, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 3145728 + }, + { + "name": "param_109", + "shape": [ + 3072, + 256 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 15728640 + }, + { + "name": "param_110", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 17301504 + }, + { + "name": "param_111", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 17307648 + }, + { + "name": "param_112", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 17313792 + }, + { + "name": "param_113", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 31469568 + } + ], + "md5sum": "a98b06905334de6643492605ed0fa08f" + }, + { + "dataPath": "params_shard_24.bin", + "format": "raw-shard", + "nbytes": 30474240, + "records": [ + { + "name": "param_114", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 0 + }, + { + "name": "param_115", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 4718592 + }, + { + "name": "param_116", + "shape": [ + 16384, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 5308416 + } + ], + "md5sum": "a7627fcb0b8897ad5b778e2bfb633481" + }, + { + "dataPath": "params_shard_25.bin", + "format": "raw-shard", + "nbytes": 33239040, + "records": [ + { + "name": "param_117", + "shape": [ + 16384, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 0 + }, + { + "name": "param_118", + "shape": [ + 3072, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 3145728 + }, + { + "name": "param_119", + "shape": [ + 3072, + 256 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 15728640 + }, + { + "name": "param_120", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 17301504 + }, + { + "name": "param_121", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 17307648 + }, + { + "name": "param_122", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 17313792 + }, + { + "name": "param_123", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 31469568 + } + ], + "md5sum": "cc15fd71e7ae435df5d24ac8efc7914b" + }, + { + "dataPath": "params_shard_26.bin", + "format": "raw-shard", + "nbytes": 30474240, + "records": [ + { + "name": "param_124", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 0 + }, + { + "name": "param_125", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 4718592 + }, + { + "name": "param_126", + "shape": [ + 16384, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 5308416 + } + ], + "md5sum": "871cb0c0da0bd2b0fa86f5bd027f7cd4" + }, + { + "dataPath": "params_shard_27.bin", + "format": "raw-shard", + "nbytes": 33239040, + "records": [ + { + "name": "param_127", + "shape": [ + 16384, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 0 + }, + { + "name": "param_128", + "shape": [ + 3072, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 3145728 + }, + { + "name": "param_129", + "shape": [ + 3072, + 256 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 15728640 + }, + { + "name": "param_130", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 17301504 + }, + { + "name": "param_131", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 17307648 + }, + { + "name": "param_132", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 17313792 + }, + { + "name": "param_133", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 31469568 + } + ], + "md5sum": "1372630bf1cc3c793393c4caa9676037" + }, + { + "dataPath": "params_shard_28.bin", + "format": "raw-shard", + "nbytes": 30474240, + "records": [ + { + "name": "param_134", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 0 + }, + { + "name": "param_135", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 4718592 + }, + { + "name": "param_136", + "shape": [ + 16384, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 5308416 + } + ], + "md5sum": "384bce670c71430046a8c55f604dd2be" + }, + { + "dataPath": "params_shard_29.bin", + "format": "raw-shard", + "nbytes": 33239040, + "records": [ + { + "name": "param_137", + "shape": [ + 16384, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 0 + }, + { + "name": "param_138", + "shape": [ + 3072, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 3145728 + }, + { + "name": "param_139", + "shape": [ + 3072, + 256 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 15728640 + }, + { + "name": "param_140", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 17301504 + }, + { + "name": "param_141", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 17307648 + }, + { + "name": "param_142", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 17313792 + }, + { + "name": "param_143", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 31469568 + } + ], + "md5sum": "c88b13da2066d10551cebd5ab92a2ce0" + }, + { + "dataPath": "params_shard_30.bin", + "format": "raw-shard", + "nbytes": 30474240, + "records": [ + { + "name": "param_144", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 0 + }, + { + "name": "param_145", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 4718592 + }, + { + "name": "param_146", + "shape": [ + 16384, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 5308416 + } + ], + "md5sum": "810e6f3b5ab150f4900dd1022ab0a40f" + }, + { + "dataPath": "params_shard_31.bin", + "format": "raw-shard", + "nbytes": 33239040, + "records": [ + { + "name": "param_147", + "shape": [ + 16384, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 0 + }, + { + "name": "param_148", + "shape": [ + 3072, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 3145728 + }, + { + "name": "param_149", + "shape": [ + 3072, + 256 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 15728640 + }, + { + "name": "param_150", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 17301504 + }, + { + "name": "param_151", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 17307648 + }, + { + "name": "param_152", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 17313792 + }, + { + "name": "param_153", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 31469568 + } + ], + "md5sum": "7831b6ba62b41e173d6a10fa2505a728" + }, + { + "dataPath": "params_shard_32.bin", + "format": "raw-shard", + "nbytes": 30474240, + "records": [ + { + "name": "param_154", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 0 + }, + { + "name": "param_155", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 4718592 + }, + { + "name": "param_156", + "shape": [ + 16384, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 5308416 + } + ], + "md5sum": "46f5b5049ec0bd2f0244115053cb08f1" + }, + { + "dataPath": "params_shard_33.bin", + "format": "raw-shard", + "nbytes": 33239040, + "records": [ + { + "name": "param_157", + "shape": [ + 16384, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 0 + }, + { + "name": "param_158", + "shape": [ + 3072, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 3145728 + }, + { + "name": "param_159", + "shape": [ + 3072, + 256 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 15728640 + }, + { + "name": "param_160", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 17301504 + }, + { + "name": "param_161", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 17307648 + }, + { + "name": "param_162", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 17313792 + }, + { + "name": "param_163", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 31469568 + } + ], + "md5sum": "d35e67cff788996fcbb377a37c2988e1" + }, + { + "dataPath": "params_shard_34.bin", + "format": "raw-shard", + "nbytes": 30474240, + "records": [ + { + "name": "param_164", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 0 + }, + { + "name": "param_165", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 4718592 + }, + { + "name": "param_166", + "shape": [ + 16384, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 5308416 + } + ], + "md5sum": "b773d61b73cbac065381e20361f4367d" + }, + { + "dataPath": "params_shard_35.bin", + "format": "raw-shard", + "nbytes": 33239040, + "records": [ + { + "name": "param_167", + "shape": [ + 16384, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 0 + }, + { + "name": "param_168", + "shape": [ + 3072, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 3145728 + }, + { + "name": "param_169", + "shape": [ + 3072, + 256 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 15728640 + }, + { + "name": "param_170", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 17301504 + }, + { + "name": "param_171", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 17307648 + }, + { + "name": "param_172", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 17313792 + }, + { + "name": "param_173", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 31469568 + } + ], + "md5sum": "26e5ed8698a8e8652345ff38879bd502" + }, + { + "dataPath": "params_shard_36.bin", + "format": "raw-shard", + "nbytes": 30474240, + "records": [ + { + "name": "param_174", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 0 + }, + { + "name": "param_175", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 4718592 + }, + { + "name": "param_176", + "shape": [ + 16384, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 5308416 + } + ], + "md5sum": "7c8d29c2e7398736627702453541c286" + }, + { + "dataPath": "params_shard_37.bin", + "format": "raw-shard", + "nbytes": 33239040, + "records": [ + { + "name": "param_177", + "shape": [ + 16384, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 0 + }, + { + "name": "param_178", + "shape": [ + 3072, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 3145728 + }, + { + "name": "param_179", + "shape": [ + 3072, + 256 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 15728640 + }, + { + "name": "param_180", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 17301504 + }, + { + "name": "param_181", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 17307648 + }, + { + "name": "param_182", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 17313792 + }, + { + "name": "param_183", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 31469568 + } + ], + "md5sum": "662ba7267d5620fd903802819eeb9788" + }, + { + "dataPath": "params_shard_38.bin", + "format": "raw-shard", + "nbytes": 30474240, + "records": [ + { + "name": "param_184", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 0 + }, + { + "name": "param_185", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 4718592 + }, + { + "name": "param_186", + "shape": [ + 16384, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 5308416 + } + ], + "md5sum": "7fca258deddd082906005d8c6b594562" + }, + { + "dataPath": "params_shard_39.bin", + "format": "raw-shard", + "nbytes": 33239040, + "records": [ + { + "name": "param_187", + "shape": [ + 16384, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 0 + }, + { + "name": "param_188", + "shape": [ + 3072, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 3145728 + }, + { + "name": "param_189", + "shape": [ + 3072, + 256 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 15728640 + }, + { + "name": "param_190", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 17301504 + }, + { + "name": "param_191", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 17307648 + }, + { + "name": "param_192", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 17313792 + }, + { + "name": "param_193", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 31469568 + } + ], + "md5sum": "5bf417a7fac3087ed714131189075816" + }, + { + "dataPath": "params_shard_40.bin", + "format": "raw-shard", + "nbytes": 30474240, + "records": [ + { + "name": "param_194", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 0 + }, + { + "name": "param_195", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 4718592 + }, + { + "name": "param_196", + "shape": [ + 16384, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 5308416 + } + ], + "md5sum": "c82817e7f5c165463d841e9a9c842997" + }, + { + "dataPath": "params_shard_41.bin", + "format": "raw-shard", + "nbytes": 33239040, + "records": [ + { + "name": "param_197", + "shape": [ + 16384, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 0 + }, + { + "name": "param_198", + "shape": [ + 3072, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 3145728 + }, + { + "name": "param_199", + "shape": [ + 3072, + 256 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 15728640 + }, + { + "name": "param_200", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 17301504 + }, + { + "name": "param_201", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 17307648 + }, + { + "name": "param_202", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 17313792 + }, + { + "name": "param_203", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 31469568 + } + ], + "md5sum": "b05284a92d345b891b61d066f50d565b" + }, + { + "dataPath": "params_shard_42.bin", + "format": "raw-shard", + "nbytes": 30474240, + "records": [ + { + "name": "param_204", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 0 + }, + { + "name": "param_205", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 4718592 + }, + { + "name": "param_206", + "shape": [ + 16384, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 5308416 + } + ], + "md5sum": "bfd684dbf1519a513ace0f048c2a39be" + }, + { + "dataPath": "params_shard_43.bin", + "format": "raw-shard", + "nbytes": 33239040, + "records": [ + { + "name": "param_207", + "shape": [ + 16384, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 0 + }, + { + "name": "param_208", + "shape": [ + 3072, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 3145728 + }, + { + "name": "param_209", + "shape": [ + 3072, + 256 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 15728640 + }, + { + "name": "param_210", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 17301504 + }, + { + "name": "param_211", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 17307648 + }, + { + "name": "param_212", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 17313792 + }, + { + "name": "param_213", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 31469568 + } + ], + "md5sum": "815087a3375fae098120207cf73606b6" + }, + { + "dataPath": "params_shard_44.bin", + "format": "raw-shard", + "nbytes": 30474240, + "records": [ + { + "name": "param_214", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 0 + }, + { + "name": "param_215", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 4718592 + }, + { + "name": "param_216", + "shape": [ + 16384, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 5308416 + } + ], + "md5sum": "5065ca3fd598a6582c10353f8a48f235" + }, + { + "dataPath": "params_shard_45.bin", + "format": "raw-shard", + "nbytes": 33239040, + "records": [ + { + "name": "param_217", + "shape": [ + 16384, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 0 + }, + { + "name": "param_218", + "shape": [ + 3072, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 3145728 + }, + { + "name": "param_219", + "shape": [ + 3072, + 256 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 15728640 + }, + { + "name": "param_220", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 17301504 + }, + { + "name": "param_221", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 17307648 + }, + { + "name": "param_222", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 17313792 + }, + { + "name": "param_223", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 31469568 + } + ], + "md5sum": "bdb40b4e92059de1100895fd5336fb7c" + }, + { + "dataPath": "params_shard_46.bin", + "format": "raw-shard", + "nbytes": 30474240, + "records": [ + { + "name": "param_224", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 0 + }, + { + "name": "param_225", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 4718592 + }, + { + "name": "param_226", + "shape": [ + 16384, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 5308416 + } + ], + "md5sum": "7a8e6878b7e620871f7b65301ec72550" + }, + { + "dataPath": "params_shard_47.bin", + "format": "raw-shard", + "nbytes": 33239040, + "records": [ + { + "name": "param_227", + "shape": [ + 16384, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 0 + }, + { + "name": "param_228", + "shape": [ + 3072, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 3145728 + }, + { + "name": "param_229", + "shape": [ + 3072, + 256 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 15728640 + }, + { + "name": "param_230", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 17301504 + }, + { + "name": "param_231", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 17307648 + }, + { + "name": "param_232", + "shape": [ + 9216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 14155776, + "byteOffset": 17313792 + }, + { + "name": "param_233", + "shape": [ + 9216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1769472, + "byteOffset": 31469568 + } + ], + "md5sum": "c4867c41c853d1d3c30bc04aa840956b" + }, + { + "dataPath": "params_shard_48.bin", + "format": "raw-shard", + "nbytes": 30474240, + "records": [ + { + "name": "param_234", + "shape": [ + 3072, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 4718592, + "byteOffset": 0 + }, + { + "name": "param_235", + "shape": [ + 3072, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 589824, + "byteOffset": 4718592 + }, + { + "name": "param_236", + "shape": [ + 16384, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 25165824, + "byteOffset": 5308416 + } + ], + "md5sum": "a80e5c1d5f2df058f023a47d703174a3" + }, + { + "dataPath": "params_shard_49.bin", + "format": "raw-shard", + "nbytes": 75595776, + "records": [ + { + "name": "param_243", + "shape": [ + 49216, + 384 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 75595776, + "byteOffset": 0 + } + ], + "md5sum": "3fd26837d3b6d618b756bb755cda1b4e" + }, + { + "dataPath": "params_shard_50.bin", + "format": "raw-shard", + "nbytes": 27817984, + "records": [ + { + "name": "param_237", + "shape": [ + 16384, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 3145728, + "byteOffset": 0 + }, + { + "name": "param_238", + "shape": [ + 3072, + 1024 + ], + "dtype": "uint32", + "format": "raw", + "nbytes": 12582912, + "byteOffset": 3145728 + }, + { + "name": "param_239", + "shape": [ + 3072, + 256 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 1572864, + "byteOffset": 15728640 + }, + { + "name": "param_240", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 17301504 + }, + { + "name": "param_241", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 17307648 + }, + { + "name": "param_242", + "shape": [ + 3072 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 6144, + "byteOffset": 17313792 + }, + { + "name": "param_244", + "shape": [ + 49216, + 96 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 9449472, + "byteOffset": 17319936 + }, + { + "name": "param_245", + "shape": [ + 2048, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 524288, + "byteOffset": 26769408 + }, + { + "name": "param_246", + "shape": [ + 2048, + 128 + ], + "dtype": "float16", + "format": "raw", + "nbytes": 524288, + "byteOffset": 27293696 + } + ], + "md5sum": "5703a84f0113a93f65e213357ebc5125" + } + ] +} \ No newline at end of file diff --git a/params/params_shard_0.bin b/params/params_shard_0.bin new file mode 100644 index 0000000000000000000000000000000000000000..93aa6afdd40317c73ba653497d20efabc7e56167 --- /dev/null +++ b/params/params_shard_0.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0caf48925d559d45ea56008e06dd0386045c3a87fd99a2ccd68c87d6a1adb16c +size 75595776 diff --git a/params/params_shard_1.bin b/params/params_shard_1.bin new file mode 100644 index 0000000000000000000000000000000000000000..d5f6365b5af0d2a291405e70f325760bf83e54b2 --- /dev/null +++ b/params/params_shard_1.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be4180f1dd651a31ecab054ca84f3d9ac1d8c3a2b4060002decc542e3bdf574c +size 25165824 diff --git a/params/params_shard_10.bin b/params/params_shard_10.bin new file mode 100644 index 0000000000000000000000000000000000000000..c752c65d6dfacdd130a74aaf921609f9afec3f91 --- /dev/null +++ b/params/params_shard_10.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69a1a4ba16d1487be929512c77d0e9f90ebb0ded887ceb129ff5fed966c01e11 +size 30474240 diff --git a/params/params_shard_11.bin b/params/params_shard_11.bin new file mode 100644 index 0000000000000000000000000000000000000000..674a29d92015cca8f36b21f602e791b5b3e25c20 --- /dev/null +++ b/params/params_shard_11.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fe474254a011af63ea72f90f651988b9f2b6a2e598338e8f60ce5a71a1616a1 +size 33239040 diff --git a/params/params_shard_12.bin b/params/params_shard_12.bin new file mode 100644 index 0000000000000000000000000000000000000000..e4bcffc3af4dd3aadd3b2c2a39af0ef92f290b4d --- /dev/null +++ b/params/params_shard_12.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e84b43e89595b1c94e8f3a3cb9a8ae8329c08ae7fe7ac4db5a3c54dd82e4a7b +size 30474240 diff --git a/params/params_shard_13.bin b/params/params_shard_13.bin new file mode 100644 index 0000000000000000000000000000000000000000..b86e1720beda58e054648f0e323da85102a03ba0 --- /dev/null +++ b/params/params_shard_13.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:321a5d197c848f83b48845ce899fcac43aa69743646aba5ec0eb193c2a8d6fb2 +size 33239040 diff --git a/params/params_shard_14.bin b/params/params_shard_14.bin new file mode 100644 index 0000000000000000000000000000000000000000..be383cf59f80bec9e1417185d5bbc7bee591b329 --- /dev/null +++ b/params/params_shard_14.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3bff37f22d9bc445c7240351b326b36715915a2537a0ccc6faea42c697faf83 +size 30474240 diff --git a/params/params_shard_15.bin b/params/params_shard_15.bin new file mode 100644 index 0000000000000000000000000000000000000000..26a91655364791ae3569a34b0842d47acf706297 --- /dev/null +++ b/params/params_shard_15.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:119d722f35281cc08bcf696906083e75e50fec1f1e37677201f717da065ba9ba +size 33239040 diff --git a/params/params_shard_16.bin b/params/params_shard_16.bin new file mode 100644 index 0000000000000000000000000000000000000000..397025dacd0d36e82b7248cff6ea02d634f9ad60 --- /dev/null +++ b/params/params_shard_16.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:120dd3921fb1102e1fa844e70fe3b60d7718dbb9337ccded4d35d1079f9775e2 +size 30474240 diff --git a/params/params_shard_17.bin b/params/params_shard_17.bin new file mode 100644 index 0000000000000000000000000000000000000000..95f4d7cc523418de195c191ab6df6d814afe18a3 --- /dev/null +++ b/params/params_shard_17.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64b78180a17c1556ab28df9bb45814101e6a41445c7502a82f7478e9e3690790 +size 33239040 diff --git a/params/params_shard_18.bin b/params/params_shard_18.bin new file mode 100644 index 0000000000000000000000000000000000000000..0a0a189c03a923a6a794e6f1e917dbaa9eecfe93 --- /dev/null +++ b/params/params_shard_18.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:356b72f0f831c7d952ac2a049d8ab8067e81069eab0f3682ea68f80032d078dc +size 30474240 diff --git a/params/params_shard_19.bin b/params/params_shard_19.bin new file mode 100644 index 0000000000000000000000000000000000000000..1d9df0e556c4e92d3fc1862bdf2c07d486e2e1a3 --- /dev/null +++ b/params/params_shard_19.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:297ee9af15309ea77d34ea016124500d631c37a4bb6dd7d2375e775a622a8b40 +size 33239040 diff --git a/params/params_shard_2.bin b/params/params_shard_2.bin new file mode 100644 index 0000000000000000000000000000000000000000..bd3b2d29e8cc0e7358600ccd5d32fff9ef642faa --- /dev/null +++ b/params/params_shard_2.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4ad2a9aedd32044da876115bc60c0f99113562933b05609dda72c045d8aa183 +size 30683136 diff --git a/params/params_shard_20.bin b/params/params_shard_20.bin new file mode 100644 index 0000000000000000000000000000000000000000..0e3055130dbb7b572fd1b6567684d11af45cf616 --- /dev/null +++ b/params/params_shard_20.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f985cdfa0b2f2704d4a6a6f0ac3d39e5acc3eb6bed9e68d9d14e2af24d96a6da +size 30474240 diff --git a/params/params_shard_21.bin b/params/params_shard_21.bin new file mode 100644 index 0000000000000000000000000000000000000000..22faf1efc740be2bcfa46e8a28a1ffaa71cedbe5 --- /dev/null +++ b/params/params_shard_21.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a209815fe5bec279be92bc4f1642b922d51e22ba370201f3513ad156523d349 +size 33239040 diff --git a/params/params_shard_22.bin b/params/params_shard_22.bin new file mode 100644 index 0000000000000000000000000000000000000000..bcb1c5752eb02e687d91b8a38b68f6425e74bf63 --- /dev/null +++ b/params/params_shard_22.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7657e75745c898223a1e20a143ba15b10dc6d95b2970c88f807c1b5ec25f3c71 +size 30474240 diff --git a/params/params_shard_23.bin b/params/params_shard_23.bin new file mode 100644 index 0000000000000000000000000000000000000000..b303b72484bf445a7e52d4a9ca842876736bb11c --- /dev/null +++ b/params/params_shard_23.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:871af80b5fb179617bba17dcfa0a5ebb335b728b6df7f4db7ddc78b32b6ce9c6 +size 33239040 diff --git a/params/params_shard_24.bin b/params/params_shard_24.bin new file mode 100644 index 0000000000000000000000000000000000000000..54db760067fb3d957287dce5a275d4042d8c9e85 --- /dev/null +++ b/params/params_shard_24.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6a1c9cfbe373441f7d926f48253e56309420cfe6a90a71c4ccf491778646f2b +size 30474240 diff --git a/params/params_shard_25.bin b/params/params_shard_25.bin new file mode 100644 index 0000000000000000000000000000000000000000..707d41335fcda704878807ec46d82b1d5100559c --- /dev/null +++ b/params/params_shard_25.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e8ae18626cf9ceb4eeac399bb9ffa3a301b758aac654bc44f011b5de2110e53 +size 33239040 diff --git a/params/params_shard_26.bin b/params/params_shard_26.bin new file mode 100644 index 0000000000000000000000000000000000000000..e336afa13d6997ba698ea945837ba35f85c92964 --- /dev/null +++ b/params/params_shard_26.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fed0f45c57f45303a982edd969bba27cf13e2043175d5923af8bd42e238be12 +size 30474240 diff --git a/params/params_shard_27.bin b/params/params_shard_27.bin new file mode 100644 index 0000000000000000000000000000000000000000..4293caa3d23e94b92190a05147297213fa0a8a58 --- /dev/null +++ b/params/params_shard_27.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c728d54e6f009d1e61cfd81446ac1c447db26fbb818600430dca819c65e1a800 +size 33239040 diff --git a/params/params_shard_28.bin b/params/params_shard_28.bin new file mode 100644 index 0000000000000000000000000000000000000000..a55d9e96a7214d0bd044d2bd683e9e73f557ad35 --- /dev/null +++ b/params/params_shard_28.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e516688a4fdedaca17b06ead13655c8c52e24cc977e4d2cbd9e58150e570c74 +size 30474240 diff --git a/params/params_shard_29.bin b/params/params_shard_29.bin new file mode 100644 index 0000000000000000000000000000000000000000..ef34d3952cb5ae8ceb7404c3b87956dc99ba0db8 --- /dev/null +++ b/params/params_shard_29.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae1c968b723e32fb08892c666a28bd5d4a5be1f4478e3a90fb5ff311b40b1afe +size 33239040 diff --git a/params/params_shard_3.bin b/params/params_shard_3.bin new file mode 100644 index 0000000000000000000000000000000000000000..71e01b125e6c3b9b7ba35b6c9a4aaeda925946d6 --- /dev/null +++ b/params/params_shard_3.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:798f70307ff7f264cb772d377bbd96d3ce0b0380a667eada383e9e8f92670886 +size 33239040 diff --git a/params/params_shard_30.bin b/params/params_shard_30.bin new file mode 100644 index 0000000000000000000000000000000000000000..592934c697f8915e6cc8b403cc4217c42056a75a --- /dev/null +++ b/params/params_shard_30.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fa3fa67d55ed83f32fa183cebd5026014b178db4b94a8968feee47aa6157922 +size 30474240 diff --git a/params/params_shard_31.bin b/params/params_shard_31.bin new file mode 100644 index 0000000000000000000000000000000000000000..2749cd333bfbb7138ee079109a9cf3aed21273c8 --- /dev/null +++ b/params/params_shard_31.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a29072b0947d2b1451c5649b9f67d5fbdac9d55a098d7682b02af3263179d00 +size 33239040 diff --git a/params/params_shard_32.bin b/params/params_shard_32.bin new file mode 100644 index 0000000000000000000000000000000000000000..5aa1d9882c7a280dc4f78c5636b3f36fcefe9de0 --- /dev/null +++ b/params/params_shard_32.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d764a0fdb9faeb153c1cf25a0e795a87963adf28f2c5ce30b2df5f3a49df8d2 +size 30474240 diff --git a/params/params_shard_33.bin b/params/params_shard_33.bin new file mode 100644 index 0000000000000000000000000000000000000000..9c7ab8a2944ba0156bf33dfc25c486ee42472faf --- /dev/null +++ b/params/params_shard_33.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a06ab40892dde63b328e1d7190bb933fb21cd4392f22f061dc83dfb83154ad3a +size 33239040 diff --git a/params/params_shard_34.bin b/params/params_shard_34.bin new file mode 100644 index 0000000000000000000000000000000000000000..d3d0771c91891d53c5c9c41e7d578b4b87b8d6b5 --- /dev/null +++ b/params/params_shard_34.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28368c97d8dae349e2ccfdbdbdcfc0bdc4241d1332358f4a7790e9e438254e85 +size 30474240 diff --git a/params/params_shard_35.bin b/params/params_shard_35.bin new file mode 100644 index 0000000000000000000000000000000000000000..131cf8bf7ac84ef131d1431670805010ba1281a8 --- /dev/null +++ b/params/params_shard_35.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9816d110a71deed28c3aa457d4cc99a90ba77194d413cc089e7a80a3706f3cd3 +size 33239040 diff --git a/params/params_shard_36.bin b/params/params_shard_36.bin new file mode 100644 index 0000000000000000000000000000000000000000..8936a8d39a88026ba57b240055c2970bcece2b8d --- /dev/null +++ b/params/params_shard_36.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8da18acfd2d709bb774e291169d9e6bb56ba5acb7698dac5985284ddbd46940 +size 30474240 diff --git a/params/params_shard_37.bin b/params/params_shard_37.bin new file mode 100644 index 0000000000000000000000000000000000000000..e28b031541feac455257515e064ee6219d4da2f8 --- /dev/null +++ b/params/params_shard_37.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30363bdb013d0d9ab1b65172221319421ceecc9851300b516a8d3edb63876fcd +size 33239040 diff --git a/params/params_shard_38.bin b/params/params_shard_38.bin new file mode 100644 index 0000000000000000000000000000000000000000..0a3ee860735392444de4b2d2bd046ddbcd28fae9 --- /dev/null +++ b/params/params_shard_38.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cec2b7d9777cab28f22c81abfdb96e0d9a9909c5ca31aa9b1d313c150eb49409 +size 30474240 diff --git a/params/params_shard_39.bin b/params/params_shard_39.bin new file mode 100644 index 0000000000000000000000000000000000000000..ebce4683d00c6c971d4e732d5dffff65b2e572a0 --- /dev/null +++ b/params/params_shard_39.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5af4dbb6b91907a8a50a341fae042f3245b3060ba3021ed9e776e271167c3711 +size 33239040 diff --git a/params/params_shard_4.bin b/params/params_shard_4.bin new file mode 100644 index 0000000000000000000000000000000000000000..e5347f4c1a3ea8f92747f8bc5d532dc8fe966df3 --- /dev/null +++ b/params/params_shard_4.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b64c1fee332205732a44ee123da07ec451c2c2cd630ca7d89bb3c2dda91ae17 +size 30474240 diff --git a/params/params_shard_40.bin b/params/params_shard_40.bin new file mode 100644 index 0000000000000000000000000000000000000000..2031b38aa5c610992fb21f6e89f83f256ed5a980 --- /dev/null +++ b/params/params_shard_40.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df98b68ba04cf44d7dbd6a93eb7e75ed8925d38b3f62ec1be1090a1ba29d28c4 +size 30474240 diff --git a/params/params_shard_41.bin b/params/params_shard_41.bin new file mode 100644 index 0000000000000000000000000000000000000000..477093a6280366f9b60d0e114558e8dca5b1c3bc --- /dev/null +++ b/params/params_shard_41.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b18550de5b27e6f126bdc691e9c52ad6cd7c893e77942cace19d3aeef5f36537 +size 33239040 diff --git a/params/params_shard_42.bin b/params/params_shard_42.bin new file mode 100644 index 0000000000000000000000000000000000000000..fa063db65aa9ba5e27de5312a7b8643b67f16941 --- /dev/null +++ b/params/params_shard_42.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5069df66406c3e1eb38aec32b59c0c4c14c078690b925fe7a60eedd8a7802c20 +size 30474240 diff --git a/params/params_shard_43.bin b/params/params_shard_43.bin new file mode 100644 index 0000000000000000000000000000000000000000..1fff31d567f7508d9e35ee6ea8f47a7dafa69737 --- /dev/null +++ b/params/params_shard_43.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8022e0f117e0ffe2a57ca3cd5d87357dce8c2bee15edc764ee93e0021bb912fc +size 33239040 diff --git a/params/params_shard_44.bin b/params/params_shard_44.bin new file mode 100644 index 0000000000000000000000000000000000000000..c16688593f9c73f720befdabb6e7c34d4cd44b36 --- /dev/null +++ b/params/params_shard_44.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4681fbd23b376b455b97b6c07fd6f21938be64b31c15590802613ed230a060a8 +size 30474240 diff --git a/params/params_shard_45.bin b/params/params_shard_45.bin new file mode 100644 index 0000000000000000000000000000000000000000..1c6267450336021617c90a631d5d4017c682aa9b --- /dev/null +++ b/params/params_shard_45.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d205b22e462a0c5fcb99b9d4e7a1b550b4b7d3414ec46f3620ad65b9e25ceab7 +size 33239040 diff --git a/params/params_shard_46.bin b/params/params_shard_46.bin new file mode 100644 index 0000000000000000000000000000000000000000..099ce7765eeb67f8a578061a5a999202a0071b1d --- /dev/null +++ b/params/params_shard_46.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76393b282df931dc149a5ba719da464ee1e1ef4122043e10b994591270bbd153 +size 30474240 diff --git a/params/params_shard_47.bin b/params/params_shard_47.bin new file mode 100644 index 0000000000000000000000000000000000000000..ea53645bb30bb2acdd2252499002d803ce7c8ae1 --- /dev/null +++ b/params/params_shard_47.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b23f3e7bac75d7f235434659e76f81afd3737d6709797fa1718928c6ee23cd8 +size 33239040 diff --git a/params/params_shard_48.bin b/params/params_shard_48.bin new file mode 100644 index 0000000000000000000000000000000000000000..78f5e2ec91edc87dbf85cffa89aea52b71a8ea2f --- /dev/null +++ b/params/params_shard_48.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d03a2d01dccc152fcecb06f8c92111828caac38993cd0723072f5ca6633a310 +size 30474240 diff --git a/params/params_shard_49.bin b/params/params_shard_49.bin new file mode 100644 index 0000000000000000000000000000000000000000..7964ab08d63681b58041815ed8ff6c930eb4692f --- /dev/null +++ b/params/params_shard_49.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3631b7c8e5315c1e95e6bf02b7e309b5d7329d7c9c73d0272242d7505c2f132 +size 75595776 diff --git a/params/params_shard_5.bin b/params/params_shard_5.bin new file mode 100644 index 0000000000000000000000000000000000000000..cf5c7aea82db98db5eec92f2542a0c5c8ed1dd26 --- /dev/null +++ b/params/params_shard_5.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a78fb69b60da961d9d9e50659d9265280db05254e981927ff17967b52551ea45 +size 33239040 diff --git a/params/params_shard_50.bin b/params/params_shard_50.bin new file mode 100644 index 0000000000000000000000000000000000000000..4184bc7896e1e1d9f821d8db4896415fe30189f2 --- /dev/null +++ b/params/params_shard_50.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af9f4b114e16e0ba8fa099b0889887cfc6bfa60a1c2e1894781624e32caac525 +size 27817984 diff --git a/params/params_shard_6.bin b/params/params_shard_6.bin new file mode 100644 index 0000000000000000000000000000000000000000..7dd9359f29221a0a90532efd31461489abb586cc --- /dev/null +++ b/params/params_shard_6.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:359c7702b6fb0cbbc0660fe1c59a91ac5861da8473f5a66b31ed10b8816ed7d0 +size 30474240 diff --git a/params/params_shard_7.bin b/params/params_shard_7.bin new file mode 100644 index 0000000000000000000000000000000000000000..95ffb84f06aa3ffbb7a5197c0163e133deff8d87 --- /dev/null +++ b/params/params_shard_7.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e73af4995bc5183b2701e827400d637d5a0662633fcfeda23a326e0ee2cf647 +size 33239040 diff --git a/params/params_shard_8.bin b/params/params_shard_8.bin new file mode 100644 index 0000000000000000000000000000000000000000..1be3d03ed258a8a22163d873d9bf21dc038c016b --- /dev/null +++ b/params/params_shard_8.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:510bd24e72c9fa5defdaede0f725ded1f1d06cb5aeff4bb8505f7083117c793a +size 30474240 diff --git a/params/params_shard_9.bin b/params/params_shard_9.bin new file mode 100644 index 0000000000000000000000000000000000000000..5dd1547fe75d483af016b20ee8a52b42145052a8 --- /dev/null +++ b/params/params_shard_9.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eacd5601d1ea7d7c4231907a00803ff5a076f65e4a29cb60368c1b74742e3f5b +size 33239040 diff --git a/params/tokenizer.model b/params/tokenizer.model new file mode 100644 index 0000000000000000000000000000000000000000..14cb1e69f41eba3bba66ff8215b1de01e273f42b --- /dev/null +++ b/params/tokenizer.model @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae87c0db2b21b0fa3fdc5e19d1f9cea94efb703cc7c6281d8718a6714b3cc2be +size 748869 diff --git a/params/tokenizer_config.json b/params/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..c55a3f9810e9f356a7c3d6b3fcd68f6af98357c9 --- /dev/null +++ b/params/tokenizer_config.json @@ -0,0 +1,37 @@ +{ + "add_bos_token": true, + "add_eos_token": false, + "bos_token": { + "__type": "AddedToken", + "content": "", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false + }, + "clean_up_tokenization_spaces": false, + "eos_token": { + "__type": "AddedToken", + "content": "", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false + }, + "legacy": null, + "model_max_length": 1000000000000000019884624838656, + "pad_token": null, + "sp_model_kwargs": {}, + "spaces_between_special_tokens": false, + "tokenizer_class": "LlamaTokenizer", + "unk_token": { + "__type": "AddedToken", + "content": "", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false + }, + "use_default_system_prompt": true, + "use_fast": true +}