diff --git a/.gitattributes b/.gitattributes
index a6344aac8c09253b3b630fb776ae94478aa0275b..52b264d3f421335397ffaf36aba6ee4d3a211b59 100644
--- a/.gitattributes
+++ b/.gitattributes
@@ -33,3 +33,6 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
*.zip filter=lfs diff=lfs merge=lfs -text
*.zst filter=lfs diff=lfs merge=lfs -text
*tfevents* filter=lfs diff=lfs merge=lfs -text
+*.so filter=lfs diff=lfs merge=lfs -text
+*.dll filter=lfs diff=lfs merge=lfs -text
+*.lib filter=lfs diff=lfs merge=lfs -text
diff --git a/MiniChat-1.5-3B-q4f16_1-vulkan.dll b/MiniChat-1.5-3B-q4f16_1-vulkan.dll
new file mode 100644
index 0000000000000000000000000000000000000000..a3a97889aa61c7c5fbfcbef22568f1852007af60
--- /dev/null
+++ b/MiniChat-1.5-3B-q4f16_1-vulkan.dll
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:be81332f4249e7fcc4fff237d988064112d77280f06a6ced02a35232c932d90c
+size 26675712
diff --git a/MiniChat-1.5-3B-q4f16_1-vulkan.exp b/MiniChat-1.5-3B-q4f16_1-vulkan.exp
new file mode 100644
index 0000000000000000000000000000000000000000..392890074d066c4e2feeb6903b4edfee5990ae35
Binary files /dev/null and b/MiniChat-1.5-3B-q4f16_1-vulkan.exp differ
diff --git a/MiniChat-1.5-3B-q4f16_1-vulkan.lib b/MiniChat-1.5-3B-q4f16_1-vulkan.lib
new file mode 100644
index 0000000000000000000000000000000000000000..f9b1d3fd98070b0a88d67a87d240e67dfafab7c1
--- /dev/null
+++ b/MiniChat-1.5-3B-q4f16_1-vulkan.lib
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9ea706f1d92d34e752c22794cde07923436f6c807ac8cd1bdb0136d44b842245
+size 14110
diff --git a/params/mlc-chat-config.json b/params/mlc-chat-config.json
new file mode 100644
index 0000000000000000000000000000000000000000..777f3d51ab87c37311b4a4e2401990167dd6e2f6
--- /dev/null
+++ b/params/mlc-chat-config.json
@@ -0,0 +1,21 @@
+{
+ "model_lib": "MiniChat-1.5-3B-q4f16_1",
+ "local_id": "MiniChat-1.5-3B-q4f16_1",
+ "conv_template": "llama_default",
+ "temperature": 0.7,
+ "repetition_penalty": 1.0,
+ "top_p": 0.95,
+ "mean_gen_len": 128,
+ "max_gen_len": 4096,
+ "num_shards": 1,
+ "use_presharded_weights": false,
+ "shift_fill_factor": 0.3,
+ "tokenizer_files": [
+ "tokenizer.model"
+ ],
+ "model_category": "llama",
+ "model_name": "MiniChat-1.5-3B",
+ "vocab_size": 49216,
+ "prefill_chunk_size": -1,
+ "max_window_size": 4096
+}
\ No newline at end of file
diff --git a/params/ndarray-cache.json b/params/ndarray-cache.json
new file mode 100644
index 0000000000000000000000000000000000000000..9cbbb52f11a941661db7f9fd6994e280ed54a111
--- /dev/null
+++ b/params/ndarray-cache.json
@@ -0,0 +1,3083 @@
+{
+ "metadata": {
+ "ParamSize": 247
+ },
+ "records": [
+ {
+ "dataPath": "params_shard_0.bin",
+ "format": "raw-shard",
+ "nbytes": 75595776,
+ "records": [
+ {
+ "name": "param_0",
+ "shape": [
+ 49216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 75595776,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "ecf15d3f0901ab7456e8e0af8ced507c"
+ },
+ {
+ "dataPath": "params_shard_1.bin",
+ "format": "raw-shard",
+ "nbytes": 25165824,
+ "records": [
+ {
+ "name": "param_6",
+ "shape": [
+ 16384,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "9bbebd6e9fb88198483ac084144d55a6"
+ },
+ {
+ "dataPath": "params_shard_2.bin",
+ "format": "raw-shard",
+ "nbytes": 30683136,
+ "records": [
+ {
+ "name": "param_1",
+ "shape": [
+ 49216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 9449472,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_2",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 9449472
+ },
+ {
+ "name": "param_3",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 23605248
+ },
+ {
+ "name": "param_4",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 25374720
+ },
+ {
+ "name": "param_5",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 30093312
+ }
+ ],
+ "md5sum": "2e5970708026d9b687364767425202cb"
+ },
+ {
+ "dataPath": "params_shard_3.bin",
+ "format": "raw-shard",
+ "nbytes": 33239040,
+ "records": [
+ {
+ "name": "param_7",
+ "shape": [
+ 16384,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_8",
+ "shape": [
+ 3072,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 12582912,
+ "byteOffset": 3145728
+ },
+ {
+ "name": "param_9",
+ "shape": [
+ 3072,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1572864,
+ "byteOffset": 15728640
+ },
+ {
+ "name": "param_10",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 17301504
+ },
+ {
+ "name": "param_11",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 17307648
+ },
+ {
+ "name": "param_12",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 17313792
+ },
+ {
+ "name": "param_13",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 31469568
+ }
+ ],
+ "md5sum": "9f934199d76c5d26646f3d545ab72fff"
+ },
+ {
+ "dataPath": "params_shard_4.bin",
+ "format": "raw-shard",
+ "nbytes": 30474240,
+ "records": [
+ {
+ "name": "param_14",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_15",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 4718592
+ },
+ {
+ "name": "param_16",
+ "shape": [
+ 16384,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 5308416
+ }
+ ],
+ "md5sum": "a3cb6df79e4429abc2be010fedfc51d1"
+ },
+ {
+ "dataPath": "params_shard_5.bin",
+ "format": "raw-shard",
+ "nbytes": 33239040,
+ "records": [
+ {
+ "name": "param_17",
+ "shape": [
+ 16384,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_18",
+ "shape": [
+ 3072,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 12582912,
+ "byteOffset": 3145728
+ },
+ {
+ "name": "param_19",
+ "shape": [
+ 3072,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1572864,
+ "byteOffset": 15728640
+ },
+ {
+ "name": "param_20",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 17301504
+ },
+ {
+ "name": "param_21",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 17307648
+ },
+ {
+ "name": "param_22",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 17313792
+ },
+ {
+ "name": "param_23",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 31469568
+ }
+ ],
+ "md5sum": "abf83c3c7e851bb5767f197da8cb1dac"
+ },
+ {
+ "dataPath": "params_shard_6.bin",
+ "format": "raw-shard",
+ "nbytes": 30474240,
+ "records": [
+ {
+ "name": "param_24",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_25",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 4718592
+ },
+ {
+ "name": "param_26",
+ "shape": [
+ 16384,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 5308416
+ }
+ ],
+ "md5sum": "6ce898064ed0861322bbf62e9d70d729"
+ },
+ {
+ "dataPath": "params_shard_7.bin",
+ "format": "raw-shard",
+ "nbytes": 33239040,
+ "records": [
+ {
+ "name": "param_27",
+ "shape": [
+ 16384,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_28",
+ "shape": [
+ 3072,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 12582912,
+ "byteOffset": 3145728
+ },
+ {
+ "name": "param_29",
+ "shape": [
+ 3072,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1572864,
+ "byteOffset": 15728640
+ },
+ {
+ "name": "param_30",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 17301504
+ },
+ {
+ "name": "param_31",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 17307648
+ },
+ {
+ "name": "param_32",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 17313792
+ },
+ {
+ "name": "param_33",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 31469568
+ }
+ ],
+ "md5sum": "172bd66af74d0e34491ae5bb801be91a"
+ },
+ {
+ "dataPath": "params_shard_8.bin",
+ "format": "raw-shard",
+ "nbytes": 30474240,
+ "records": [
+ {
+ "name": "param_34",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_35",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 4718592
+ },
+ {
+ "name": "param_36",
+ "shape": [
+ 16384,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 5308416
+ }
+ ],
+ "md5sum": "80622e63178dc3e00ced75b53b23fd35"
+ },
+ {
+ "dataPath": "params_shard_9.bin",
+ "format": "raw-shard",
+ "nbytes": 33239040,
+ "records": [
+ {
+ "name": "param_37",
+ "shape": [
+ 16384,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_38",
+ "shape": [
+ 3072,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 12582912,
+ "byteOffset": 3145728
+ },
+ {
+ "name": "param_39",
+ "shape": [
+ 3072,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1572864,
+ "byteOffset": 15728640
+ },
+ {
+ "name": "param_40",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 17301504
+ },
+ {
+ "name": "param_41",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 17307648
+ },
+ {
+ "name": "param_42",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 17313792
+ },
+ {
+ "name": "param_43",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 31469568
+ }
+ ],
+ "md5sum": "1b105ec9d866d775cb69379c40757f88"
+ },
+ {
+ "dataPath": "params_shard_10.bin",
+ "format": "raw-shard",
+ "nbytes": 30474240,
+ "records": [
+ {
+ "name": "param_44",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_45",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 4718592
+ },
+ {
+ "name": "param_46",
+ "shape": [
+ 16384,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 5308416
+ }
+ ],
+ "md5sum": "8ca5fd22e33b7ecfc4edb22c2429bea0"
+ },
+ {
+ "dataPath": "params_shard_11.bin",
+ "format": "raw-shard",
+ "nbytes": 33239040,
+ "records": [
+ {
+ "name": "param_47",
+ "shape": [
+ 16384,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_48",
+ "shape": [
+ 3072,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 12582912,
+ "byteOffset": 3145728
+ },
+ {
+ "name": "param_49",
+ "shape": [
+ 3072,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1572864,
+ "byteOffset": 15728640
+ },
+ {
+ "name": "param_50",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 17301504
+ },
+ {
+ "name": "param_51",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 17307648
+ },
+ {
+ "name": "param_52",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 17313792
+ },
+ {
+ "name": "param_53",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 31469568
+ }
+ ],
+ "md5sum": "33dbf522d5e71a2c9c80bba1cd630861"
+ },
+ {
+ "dataPath": "params_shard_12.bin",
+ "format": "raw-shard",
+ "nbytes": 30474240,
+ "records": [
+ {
+ "name": "param_54",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_55",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 4718592
+ },
+ {
+ "name": "param_56",
+ "shape": [
+ 16384,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 5308416
+ }
+ ],
+ "md5sum": "ffc57c8bae42beb9ca8bd2f58a9e4b90"
+ },
+ {
+ "dataPath": "params_shard_13.bin",
+ "format": "raw-shard",
+ "nbytes": 33239040,
+ "records": [
+ {
+ "name": "param_57",
+ "shape": [
+ 16384,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_58",
+ "shape": [
+ 3072,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 12582912,
+ "byteOffset": 3145728
+ },
+ {
+ "name": "param_59",
+ "shape": [
+ 3072,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1572864,
+ "byteOffset": 15728640
+ },
+ {
+ "name": "param_60",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 17301504
+ },
+ {
+ "name": "param_61",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 17307648
+ },
+ {
+ "name": "param_62",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 17313792
+ },
+ {
+ "name": "param_63",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 31469568
+ }
+ ],
+ "md5sum": "7000c9ae4c55bccc6d8d4ff1cbfd6543"
+ },
+ {
+ "dataPath": "params_shard_14.bin",
+ "format": "raw-shard",
+ "nbytes": 30474240,
+ "records": [
+ {
+ "name": "param_64",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_65",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 4718592
+ },
+ {
+ "name": "param_66",
+ "shape": [
+ 16384,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 5308416
+ }
+ ],
+ "md5sum": "948f3bbf1c76842dde7f1b9831212144"
+ },
+ {
+ "dataPath": "params_shard_15.bin",
+ "format": "raw-shard",
+ "nbytes": 33239040,
+ "records": [
+ {
+ "name": "param_67",
+ "shape": [
+ 16384,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_68",
+ "shape": [
+ 3072,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 12582912,
+ "byteOffset": 3145728
+ },
+ {
+ "name": "param_69",
+ "shape": [
+ 3072,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1572864,
+ "byteOffset": 15728640
+ },
+ {
+ "name": "param_70",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 17301504
+ },
+ {
+ "name": "param_71",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 17307648
+ },
+ {
+ "name": "param_72",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 17313792
+ },
+ {
+ "name": "param_73",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 31469568
+ }
+ ],
+ "md5sum": "32bec1a6997ffbfd0ab9e93f56b9ad87"
+ },
+ {
+ "dataPath": "params_shard_16.bin",
+ "format": "raw-shard",
+ "nbytes": 30474240,
+ "records": [
+ {
+ "name": "param_74",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_75",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 4718592
+ },
+ {
+ "name": "param_76",
+ "shape": [
+ 16384,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 5308416
+ }
+ ],
+ "md5sum": "8711c6302582fddaa4c9e7ed91a75c7b"
+ },
+ {
+ "dataPath": "params_shard_17.bin",
+ "format": "raw-shard",
+ "nbytes": 33239040,
+ "records": [
+ {
+ "name": "param_77",
+ "shape": [
+ 16384,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_78",
+ "shape": [
+ 3072,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 12582912,
+ "byteOffset": 3145728
+ },
+ {
+ "name": "param_79",
+ "shape": [
+ 3072,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1572864,
+ "byteOffset": 15728640
+ },
+ {
+ "name": "param_80",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 17301504
+ },
+ {
+ "name": "param_81",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 17307648
+ },
+ {
+ "name": "param_82",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 17313792
+ },
+ {
+ "name": "param_83",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 31469568
+ }
+ ],
+ "md5sum": "29147a956d8177b8d4b5c57754a7d670"
+ },
+ {
+ "dataPath": "params_shard_18.bin",
+ "format": "raw-shard",
+ "nbytes": 30474240,
+ "records": [
+ {
+ "name": "param_84",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_85",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 4718592
+ },
+ {
+ "name": "param_86",
+ "shape": [
+ 16384,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 5308416
+ }
+ ],
+ "md5sum": "1471ebee434c1147a18f440f09f98e91"
+ },
+ {
+ "dataPath": "params_shard_19.bin",
+ "format": "raw-shard",
+ "nbytes": 33239040,
+ "records": [
+ {
+ "name": "param_87",
+ "shape": [
+ 16384,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_88",
+ "shape": [
+ 3072,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 12582912,
+ "byteOffset": 3145728
+ },
+ {
+ "name": "param_89",
+ "shape": [
+ 3072,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1572864,
+ "byteOffset": 15728640
+ },
+ {
+ "name": "param_90",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 17301504
+ },
+ {
+ "name": "param_91",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 17307648
+ },
+ {
+ "name": "param_92",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 17313792
+ },
+ {
+ "name": "param_93",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 31469568
+ }
+ ],
+ "md5sum": "0e32a9c897b51680f461e8b1008f5701"
+ },
+ {
+ "dataPath": "params_shard_20.bin",
+ "format": "raw-shard",
+ "nbytes": 30474240,
+ "records": [
+ {
+ "name": "param_94",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_95",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 4718592
+ },
+ {
+ "name": "param_96",
+ "shape": [
+ 16384,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 5308416
+ }
+ ],
+ "md5sum": "e26e42c69c260b3bb2ab55694b1482fa"
+ },
+ {
+ "dataPath": "params_shard_21.bin",
+ "format": "raw-shard",
+ "nbytes": 33239040,
+ "records": [
+ {
+ "name": "param_97",
+ "shape": [
+ 16384,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_98",
+ "shape": [
+ 3072,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 12582912,
+ "byteOffset": 3145728
+ },
+ {
+ "name": "param_99",
+ "shape": [
+ 3072,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1572864,
+ "byteOffset": 15728640
+ },
+ {
+ "name": "param_100",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 17301504
+ },
+ {
+ "name": "param_101",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 17307648
+ },
+ {
+ "name": "param_102",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 17313792
+ },
+ {
+ "name": "param_103",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 31469568
+ }
+ ],
+ "md5sum": "ae647c3f3d6a097e5470cf69248d3a63"
+ },
+ {
+ "dataPath": "params_shard_22.bin",
+ "format": "raw-shard",
+ "nbytes": 30474240,
+ "records": [
+ {
+ "name": "param_104",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_105",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 4718592
+ },
+ {
+ "name": "param_106",
+ "shape": [
+ 16384,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 5308416
+ }
+ ],
+ "md5sum": "871acb8160143ca04a5347cc79ec7885"
+ },
+ {
+ "dataPath": "params_shard_23.bin",
+ "format": "raw-shard",
+ "nbytes": 33239040,
+ "records": [
+ {
+ "name": "param_107",
+ "shape": [
+ 16384,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_108",
+ "shape": [
+ 3072,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 12582912,
+ "byteOffset": 3145728
+ },
+ {
+ "name": "param_109",
+ "shape": [
+ 3072,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1572864,
+ "byteOffset": 15728640
+ },
+ {
+ "name": "param_110",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 17301504
+ },
+ {
+ "name": "param_111",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 17307648
+ },
+ {
+ "name": "param_112",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 17313792
+ },
+ {
+ "name": "param_113",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 31469568
+ }
+ ],
+ "md5sum": "a98b06905334de6643492605ed0fa08f"
+ },
+ {
+ "dataPath": "params_shard_24.bin",
+ "format": "raw-shard",
+ "nbytes": 30474240,
+ "records": [
+ {
+ "name": "param_114",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_115",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 4718592
+ },
+ {
+ "name": "param_116",
+ "shape": [
+ 16384,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 5308416
+ }
+ ],
+ "md5sum": "a7627fcb0b8897ad5b778e2bfb633481"
+ },
+ {
+ "dataPath": "params_shard_25.bin",
+ "format": "raw-shard",
+ "nbytes": 33239040,
+ "records": [
+ {
+ "name": "param_117",
+ "shape": [
+ 16384,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_118",
+ "shape": [
+ 3072,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 12582912,
+ "byteOffset": 3145728
+ },
+ {
+ "name": "param_119",
+ "shape": [
+ 3072,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1572864,
+ "byteOffset": 15728640
+ },
+ {
+ "name": "param_120",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 17301504
+ },
+ {
+ "name": "param_121",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 17307648
+ },
+ {
+ "name": "param_122",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 17313792
+ },
+ {
+ "name": "param_123",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 31469568
+ }
+ ],
+ "md5sum": "cc15fd71e7ae435df5d24ac8efc7914b"
+ },
+ {
+ "dataPath": "params_shard_26.bin",
+ "format": "raw-shard",
+ "nbytes": 30474240,
+ "records": [
+ {
+ "name": "param_124",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_125",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 4718592
+ },
+ {
+ "name": "param_126",
+ "shape": [
+ 16384,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 5308416
+ }
+ ],
+ "md5sum": "871cb0c0da0bd2b0fa86f5bd027f7cd4"
+ },
+ {
+ "dataPath": "params_shard_27.bin",
+ "format": "raw-shard",
+ "nbytes": 33239040,
+ "records": [
+ {
+ "name": "param_127",
+ "shape": [
+ 16384,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_128",
+ "shape": [
+ 3072,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 12582912,
+ "byteOffset": 3145728
+ },
+ {
+ "name": "param_129",
+ "shape": [
+ 3072,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1572864,
+ "byteOffset": 15728640
+ },
+ {
+ "name": "param_130",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 17301504
+ },
+ {
+ "name": "param_131",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 17307648
+ },
+ {
+ "name": "param_132",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 17313792
+ },
+ {
+ "name": "param_133",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 31469568
+ }
+ ],
+ "md5sum": "1372630bf1cc3c793393c4caa9676037"
+ },
+ {
+ "dataPath": "params_shard_28.bin",
+ "format": "raw-shard",
+ "nbytes": 30474240,
+ "records": [
+ {
+ "name": "param_134",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_135",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 4718592
+ },
+ {
+ "name": "param_136",
+ "shape": [
+ 16384,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 5308416
+ }
+ ],
+ "md5sum": "384bce670c71430046a8c55f604dd2be"
+ },
+ {
+ "dataPath": "params_shard_29.bin",
+ "format": "raw-shard",
+ "nbytes": 33239040,
+ "records": [
+ {
+ "name": "param_137",
+ "shape": [
+ 16384,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_138",
+ "shape": [
+ 3072,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 12582912,
+ "byteOffset": 3145728
+ },
+ {
+ "name": "param_139",
+ "shape": [
+ 3072,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1572864,
+ "byteOffset": 15728640
+ },
+ {
+ "name": "param_140",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 17301504
+ },
+ {
+ "name": "param_141",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 17307648
+ },
+ {
+ "name": "param_142",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 17313792
+ },
+ {
+ "name": "param_143",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 31469568
+ }
+ ],
+ "md5sum": "c88b13da2066d10551cebd5ab92a2ce0"
+ },
+ {
+ "dataPath": "params_shard_30.bin",
+ "format": "raw-shard",
+ "nbytes": 30474240,
+ "records": [
+ {
+ "name": "param_144",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_145",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 4718592
+ },
+ {
+ "name": "param_146",
+ "shape": [
+ 16384,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 5308416
+ }
+ ],
+ "md5sum": "810e6f3b5ab150f4900dd1022ab0a40f"
+ },
+ {
+ "dataPath": "params_shard_31.bin",
+ "format": "raw-shard",
+ "nbytes": 33239040,
+ "records": [
+ {
+ "name": "param_147",
+ "shape": [
+ 16384,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_148",
+ "shape": [
+ 3072,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 12582912,
+ "byteOffset": 3145728
+ },
+ {
+ "name": "param_149",
+ "shape": [
+ 3072,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1572864,
+ "byteOffset": 15728640
+ },
+ {
+ "name": "param_150",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 17301504
+ },
+ {
+ "name": "param_151",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 17307648
+ },
+ {
+ "name": "param_152",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 17313792
+ },
+ {
+ "name": "param_153",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 31469568
+ }
+ ],
+ "md5sum": "7831b6ba62b41e173d6a10fa2505a728"
+ },
+ {
+ "dataPath": "params_shard_32.bin",
+ "format": "raw-shard",
+ "nbytes": 30474240,
+ "records": [
+ {
+ "name": "param_154",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_155",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 4718592
+ },
+ {
+ "name": "param_156",
+ "shape": [
+ 16384,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 5308416
+ }
+ ],
+ "md5sum": "46f5b5049ec0bd2f0244115053cb08f1"
+ },
+ {
+ "dataPath": "params_shard_33.bin",
+ "format": "raw-shard",
+ "nbytes": 33239040,
+ "records": [
+ {
+ "name": "param_157",
+ "shape": [
+ 16384,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_158",
+ "shape": [
+ 3072,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 12582912,
+ "byteOffset": 3145728
+ },
+ {
+ "name": "param_159",
+ "shape": [
+ 3072,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1572864,
+ "byteOffset": 15728640
+ },
+ {
+ "name": "param_160",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 17301504
+ },
+ {
+ "name": "param_161",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 17307648
+ },
+ {
+ "name": "param_162",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 17313792
+ },
+ {
+ "name": "param_163",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 31469568
+ }
+ ],
+ "md5sum": "d35e67cff788996fcbb377a37c2988e1"
+ },
+ {
+ "dataPath": "params_shard_34.bin",
+ "format": "raw-shard",
+ "nbytes": 30474240,
+ "records": [
+ {
+ "name": "param_164",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_165",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 4718592
+ },
+ {
+ "name": "param_166",
+ "shape": [
+ 16384,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 5308416
+ }
+ ],
+ "md5sum": "b773d61b73cbac065381e20361f4367d"
+ },
+ {
+ "dataPath": "params_shard_35.bin",
+ "format": "raw-shard",
+ "nbytes": 33239040,
+ "records": [
+ {
+ "name": "param_167",
+ "shape": [
+ 16384,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_168",
+ "shape": [
+ 3072,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 12582912,
+ "byteOffset": 3145728
+ },
+ {
+ "name": "param_169",
+ "shape": [
+ 3072,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1572864,
+ "byteOffset": 15728640
+ },
+ {
+ "name": "param_170",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 17301504
+ },
+ {
+ "name": "param_171",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 17307648
+ },
+ {
+ "name": "param_172",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 17313792
+ },
+ {
+ "name": "param_173",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 31469568
+ }
+ ],
+ "md5sum": "26e5ed8698a8e8652345ff38879bd502"
+ },
+ {
+ "dataPath": "params_shard_36.bin",
+ "format": "raw-shard",
+ "nbytes": 30474240,
+ "records": [
+ {
+ "name": "param_174",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_175",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 4718592
+ },
+ {
+ "name": "param_176",
+ "shape": [
+ 16384,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 5308416
+ }
+ ],
+ "md5sum": "7c8d29c2e7398736627702453541c286"
+ },
+ {
+ "dataPath": "params_shard_37.bin",
+ "format": "raw-shard",
+ "nbytes": 33239040,
+ "records": [
+ {
+ "name": "param_177",
+ "shape": [
+ 16384,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_178",
+ "shape": [
+ 3072,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 12582912,
+ "byteOffset": 3145728
+ },
+ {
+ "name": "param_179",
+ "shape": [
+ 3072,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1572864,
+ "byteOffset": 15728640
+ },
+ {
+ "name": "param_180",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 17301504
+ },
+ {
+ "name": "param_181",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 17307648
+ },
+ {
+ "name": "param_182",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 17313792
+ },
+ {
+ "name": "param_183",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 31469568
+ }
+ ],
+ "md5sum": "662ba7267d5620fd903802819eeb9788"
+ },
+ {
+ "dataPath": "params_shard_38.bin",
+ "format": "raw-shard",
+ "nbytes": 30474240,
+ "records": [
+ {
+ "name": "param_184",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_185",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 4718592
+ },
+ {
+ "name": "param_186",
+ "shape": [
+ 16384,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 5308416
+ }
+ ],
+ "md5sum": "7fca258deddd082906005d8c6b594562"
+ },
+ {
+ "dataPath": "params_shard_39.bin",
+ "format": "raw-shard",
+ "nbytes": 33239040,
+ "records": [
+ {
+ "name": "param_187",
+ "shape": [
+ 16384,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_188",
+ "shape": [
+ 3072,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 12582912,
+ "byteOffset": 3145728
+ },
+ {
+ "name": "param_189",
+ "shape": [
+ 3072,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1572864,
+ "byteOffset": 15728640
+ },
+ {
+ "name": "param_190",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 17301504
+ },
+ {
+ "name": "param_191",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 17307648
+ },
+ {
+ "name": "param_192",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 17313792
+ },
+ {
+ "name": "param_193",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 31469568
+ }
+ ],
+ "md5sum": "5bf417a7fac3087ed714131189075816"
+ },
+ {
+ "dataPath": "params_shard_40.bin",
+ "format": "raw-shard",
+ "nbytes": 30474240,
+ "records": [
+ {
+ "name": "param_194",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_195",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 4718592
+ },
+ {
+ "name": "param_196",
+ "shape": [
+ 16384,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 5308416
+ }
+ ],
+ "md5sum": "c82817e7f5c165463d841e9a9c842997"
+ },
+ {
+ "dataPath": "params_shard_41.bin",
+ "format": "raw-shard",
+ "nbytes": 33239040,
+ "records": [
+ {
+ "name": "param_197",
+ "shape": [
+ 16384,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_198",
+ "shape": [
+ 3072,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 12582912,
+ "byteOffset": 3145728
+ },
+ {
+ "name": "param_199",
+ "shape": [
+ 3072,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1572864,
+ "byteOffset": 15728640
+ },
+ {
+ "name": "param_200",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 17301504
+ },
+ {
+ "name": "param_201",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 17307648
+ },
+ {
+ "name": "param_202",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 17313792
+ },
+ {
+ "name": "param_203",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 31469568
+ }
+ ],
+ "md5sum": "b05284a92d345b891b61d066f50d565b"
+ },
+ {
+ "dataPath": "params_shard_42.bin",
+ "format": "raw-shard",
+ "nbytes": 30474240,
+ "records": [
+ {
+ "name": "param_204",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_205",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 4718592
+ },
+ {
+ "name": "param_206",
+ "shape": [
+ 16384,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 5308416
+ }
+ ],
+ "md5sum": "bfd684dbf1519a513ace0f048c2a39be"
+ },
+ {
+ "dataPath": "params_shard_43.bin",
+ "format": "raw-shard",
+ "nbytes": 33239040,
+ "records": [
+ {
+ "name": "param_207",
+ "shape": [
+ 16384,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_208",
+ "shape": [
+ 3072,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 12582912,
+ "byteOffset": 3145728
+ },
+ {
+ "name": "param_209",
+ "shape": [
+ 3072,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1572864,
+ "byteOffset": 15728640
+ },
+ {
+ "name": "param_210",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 17301504
+ },
+ {
+ "name": "param_211",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 17307648
+ },
+ {
+ "name": "param_212",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 17313792
+ },
+ {
+ "name": "param_213",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 31469568
+ }
+ ],
+ "md5sum": "815087a3375fae098120207cf73606b6"
+ },
+ {
+ "dataPath": "params_shard_44.bin",
+ "format": "raw-shard",
+ "nbytes": 30474240,
+ "records": [
+ {
+ "name": "param_214",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_215",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 4718592
+ },
+ {
+ "name": "param_216",
+ "shape": [
+ 16384,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 5308416
+ }
+ ],
+ "md5sum": "5065ca3fd598a6582c10353f8a48f235"
+ },
+ {
+ "dataPath": "params_shard_45.bin",
+ "format": "raw-shard",
+ "nbytes": 33239040,
+ "records": [
+ {
+ "name": "param_217",
+ "shape": [
+ 16384,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_218",
+ "shape": [
+ 3072,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 12582912,
+ "byteOffset": 3145728
+ },
+ {
+ "name": "param_219",
+ "shape": [
+ 3072,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1572864,
+ "byteOffset": 15728640
+ },
+ {
+ "name": "param_220",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 17301504
+ },
+ {
+ "name": "param_221",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 17307648
+ },
+ {
+ "name": "param_222",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 17313792
+ },
+ {
+ "name": "param_223",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 31469568
+ }
+ ],
+ "md5sum": "bdb40b4e92059de1100895fd5336fb7c"
+ },
+ {
+ "dataPath": "params_shard_46.bin",
+ "format": "raw-shard",
+ "nbytes": 30474240,
+ "records": [
+ {
+ "name": "param_224",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_225",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 4718592
+ },
+ {
+ "name": "param_226",
+ "shape": [
+ 16384,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 5308416
+ }
+ ],
+ "md5sum": "7a8e6878b7e620871f7b65301ec72550"
+ },
+ {
+ "dataPath": "params_shard_47.bin",
+ "format": "raw-shard",
+ "nbytes": 33239040,
+ "records": [
+ {
+ "name": "param_227",
+ "shape": [
+ 16384,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_228",
+ "shape": [
+ 3072,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 12582912,
+ "byteOffset": 3145728
+ },
+ {
+ "name": "param_229",
+ "shape": [
+ 3072,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1572864,
+ "byteOffset": 15728640
+ },
+ {
+ "name": "param_230",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 17301504
+ },
+ {
+ "name": "param_231",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 17307648
+ },
+ {
+ "name": "param_232",
+ "shape": [
+ 9216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 14155776,
+ "byteOffset": 17313792
+ },
+ {
+ "name": "param_233",
+ "shape": [
+ 9216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1769472,
+ "byteOffset": 31469568
+ }
+ ],
+ "md5sum": "c4867c41c853d1d3c30bc04aa840956b"
+ },
+ {
+ "dataPath": "params_shard_48.bin",
+ "format": "raw-shard",
+ "nbytes": 30474240,
+ "records": [
+ {
+ "name": "param_234",
+ "shape": [
+ 3072,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 4718592,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_235",
+ "shape": [
+ 3072,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 589824,
+ "byteOffset": 4718592
+ },
+ {
+ "name": "param_236",
+ "shape": [
+ 16384,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 25165824,
+ "byteOffset": 5308416
+ }
+ ],
+ "md5sum": "a80e5c1d5f2df058f023a47d703174a3"
+ },
+ {
+ "dataPath": "params_shard_49.bin",
+ "format": "raw-shard",
+ "nbytes": 75595776,
+ "records": [
+ {
+ "name": "param_243",
+ "shape": [
+ 49216,
+ 384
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 75595776,
+ "byteOffset": 0
+ }
+ ],
+ "md5sum": "3fd26837d3b6d618b756bb755cda1b4e"
+ },
+ {
+ "dataPath": "params_shard_50.bin",
+ "format": "raw-shard",
+ "nbytes": 27817984,
+ "records": [
+ {
+ "name": "param_237",
+ "shape": [
+ 16384,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 3145728,
+ "byteOffset": 0
+ },
+ {
+ "name": "param_238",
+ "shape": [
+ 3072,
+ 1024
+ ],
+ "dtype": "uint32",
+ "format": "raw",
+ "nbytes": 12582912,
+ "byteOffset": 3145728
+ },
+ {
+ "name": "param_239",
+ "shape": [
+ 3072,
+ 256
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 1572864,
+ "byteOffset": 15728640
+ },
+ {
+ "name": "param_240",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 17301504
+ },
+ {
+ "name": "param_241",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 17307648
+ },
+ {
+ "name": "param_242",
+ "shape": [
+ 3072
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 6144,
+ "byteOffset": 17313792
+ },
+ {
+ "name": "param_244",
+ "shape": [
+ 49216,
+ 96
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 9449472,
+ "byteOffset": 17319936
+ },
+ {
+ "name": "param_245",
+ "shape": [
+ 2048,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 524288,
+ "byteOffset": 26769408
+ },
+ {
+ "name": "param_246",
+ "shape": [
+ 2048,
+ 128
+ ],
+ "dtype": "float16",
+ "format": "raw",
+ "nbytes": 524288,
+ "byteOffset": 27293696
+ }
+ ],
+ "md5sum": "5703a84f0113a93f65e213357ebc5125"
+ }
+ ]
+}
\ No newline at end of file
diff --git a/params/params_shard_0.bin b/params/params_shard_0.bin
new file mode 100644
index 0000000000000000000000000000000000000000..93aa6afdd40317c73ba653497d20efabc7e56167
--- /dev/null
+++ b/params/params_shard_0.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0caf48925d559d45ea56008e06dd0386045c3a87fd99a2ccd68c87d6a1adb16c
+size 75595776
diff --git a/params/params_shard_1.bin b/params/params_shard_1.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d5f6365b5af0d2a291405e70f325760bf83e54b2
--- /dev/null
+++ b/params/params_shard_1.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:be4180f1dd651a31ecab054ca84f3d9ac1d8c3a2b4060002decc542e3bdf574c
+size 25165824
diff --git a/params/params_shard_10.bin b/params/params_shard_10.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c752c65d6dfacdd130a74aaf921609f9afec3f91
--- /dev/null
+++ b/params/params_shard_10.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:69a1a4ba16d1487be929512c77d0e9f90ebb0ded887ceb129ff5fed966c01e11
+size 30474240
diff --git a/params/params_shard_11.bin b/params/params_shard_11.bin
new file mode 100644
index 0000000000000000000000000000000000000000..674a29d92015cca8f36b21f602e791b5b3e25c20
--- /dev/null
+++ b/params/params_shard_11.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1fe474254a011af63ea72f90f651988b9f2b6a2e598338e8f60ce5a71a1616a1
+size 33239040
diff --git a/params/params_shard_12.bin b/params/params_shard_12.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e4bcffc3af4dd3aadd3b2c2a39af0ef92f290b4d
--- /dev/null
+++ b/params/params_shard_12.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9e84b43e89595b1c94e8f3a3cb9a8ae8329c08ae7fe7ac4db5a3c54dd82e4a7b
+size 30474240
diff --git a/params/params_shard_13.bin b/params/params_shard_13.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b86e1720beda58e054648f0e323da85102a03ba0
--- /dev/null
+++ b/params/params_shard_13.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:321a5d197c848f83b48845ce899fcac43aa69743646aba5ec0eb193c2a8d6fb2
+size 33239040
diff --git a/params/params_shard_14.bin b/params/params_shard_14.bin
new file mode 100644
index 0000000000000000000000000000000000000000..be383cf59f80bec9e1417185d5bbc7bee591b329
--- /dev/null
+++ b/params/params_shard_14.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d3bff37f22d9bc445c7240351b326b36715915a2537a0ccc6faea42c697faf83
+size 30474240
diff --git a/params/params_shard_15.bin b/params/params_shard_15.bin
new file mode 100644
index 0000000000000000000000000000000000000000..26a91655364791ae3569a34b0842d47acf706297
--- /dev/null
+++ b/params/params_shard_15.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:119d722f35281cc08bcf696906083e75e50fec1f1e37677201f717da065ba9ba
+size 33239040
diff --git a/params/params_shard_16.bin b/params/params_shard_16.bin
new file mode 100644
index 0000000000000000000000000000000000000000..397025dacd0d36e82b7248cff6ea02d634f9ad60
--- /dev/null
+++ b/params/params_shard_16.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:120dd3921fb1102e1fa844e70fe3b60d7718dbb9337ccded4d35d1079f9775e2
+size 30474240
diff --git a/params/params_shard_17.bin b/params/params_shard_17.bin
new file mode 100644
index 0000000000000000000000000000000000000000..95f4d7cc523418de195c191ab6df6d814afe18a3
--- /dev/null
+++ b/params/params_shard_17.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:64b78180a17c1556ab28df9bb45814101e6a41445c7502a82f7478e9e3690790
+size 33239040
diff --git a/params/params_shard_18.bin b/params/params_shard_18.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0a0a189c03a923a6a794e6f1e917dbaa9eecfe93
--- /dev/null
+++ b/params/params_shard_18.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:356b72f0f831c7d952ac2a049d8ab8067e81069eab0f3682ea68f80032d078dc
+size 30474240
diff --git a/params/params_shard_19.bin b/params/params_shard_19.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1d9df0e556c4e92d3fc1862bdf2c07d486e2e1a3
--- /dev/null
+++ b/params/params_shard_19.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:297ee9af15309ea77d34ea016124500d631c37a4bb6dd7d2375e775a622a8b40
+size 33239040
diff --git a/params/params_shard_2.bin b/params/params_shard_2.bin
new file mode 100644
index 0000000000000000000000000000000000000000..bd3b2d29e8cc0e7358600ccd5d32fff9ef642faa
--- /dev/null
+++ b/params/params_shard_2.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d4ad2a9aedd32044da876115bc60c0f99113562933b05609dda72c045d8aa183
+size 30683136
diff --git a/params/params_shard_20.bin b/params/params_shard_20.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0e3055130dbb7b572fd1b6567684d11af45cf616
--- /dev/null
+++ b/params/params_shard_20.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f985cdfa0b2f2704d4a6a6f0ac3d39e5acc3eb6bed9e68d9d14e2af24d96a6da
+size 30474240
diff --git a/params/params_shard_21.bin b/params/params_shard_21.bin
new file mode 100644
index 0000000000000000000000000000000000000000..22faf1efc740be2bcfa46e8a28a1ffaa71cedbe5
--- /dev/null
+++ b/params/params_shard_21.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5a209815fe5bec279be92bc4f1642b922d51e22ba370201f3513ad156523d349
+size 33239040
diff --git a/params/params_shard_22.bin b/params/params_shard_22.bin
new file mode 100644
index 0000000000000000000000000000000000000000..bcb1c5752eb02e687d91b8a38b68f6425e74bf63
--- /dev/null
+++ b/params/params_shard_22.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7657e75745c898223a1e20a143ba15b10dc6d95b2970c88f807c1b5ec25f3c71
+size 30474240
diff --git a/params/params_shard_23.bin b/params/params_shard_23.bin
new file mode 100644
index 0000000000000000000000000000000000000000..b303b72484bf445a7e52d4a9ca842876736bb11c
--- /dev/null
+++ b/params/params_shard_23.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:871af80b5fb179617bba17dcfa0a5ebb335b728b6df7f4db7ddc78b32b6ce9c6
+size 33239040
diff --git a/params/params_shard_24.bin b/params/params_shard_24.bin
new file mode 100644
index 0000000000000000000000000000000000000000..54db760067fb3d957287dce5a275d4042d8c9e85
--- /dev/null
+++ b/params/params_shard_24.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a6a1c9cfbe373441f7d926f48253e56309420cfe6a90a71c4ccf491778646f2b
+size 30474240
diff --git a/params/params_shard_25.bin b/params/params_shard_25.bin
new file mode 100644
index 0000000000000000000000000000000000000000..707d41335fcda704878807ec46d82b1d5100559c
--- /dev/null
+++ b/params/params_shard_25.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8e8ae18626cf9ceb4eeac399bb9ffa3a301b758aac654bc44f011b5de2110e53
+size 33239040
diff --git a/params/params_shard_26.bin b/params/params_shard_26.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e336afa13d6997ba698ea945837ba35f85c92964
--- /dev/null
+++ b/params/params_shard_26.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7fed0f45c57f45303a982edd969bba27cf13e2043175d5923af8bd42e238be12
+size 30474240
diff --git a/params/params_shard_27.bin b/params/params_shard_27.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4293caa3d23e94b92190a05147297213fa0a8a58
--- /dev/null
+++ b/params/params_shard_27.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c728d54e6f009d1e61cfd81446ac1c447db26fbb818600430dca819c65e1a800
+size 33239040
diff --git a/params/params_shard_28.bin b/params/params_shard_28.bin
new file mode 100644
index 0000000000000000000000000000000000000000..a55d9e96a7214d0bd044d2bd683e9e73f557ad35
--- /dev/null
+++ b/params/params_shard_28.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9e516688a4fdedaca17b06ead13655c8c52e24cc977e4d2cbd9e58150e570c74
+size 30474240
diff --git a/params/params_shard_29.bin b/params/params_shard_29.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ef34d3952cb5ae8ceb7404c3b87956dc99ba0db8
--- /dev/null
+++ b/params/params_shard_29.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ae1c968b723e32fb08892c666a28bd5d4a5be1f4478e3a90fb5ff311b40b1afe
+size 33239040
diff --git a/params/params_shard_3.bin b/params/params_shard_3.bin
new file mode 100644
index 0000000000000000000000000000000000000000..71e01b125e6c3b9b7ba35b6c9a4aaeda925946d6
--- /dev/null
+++ b/params/params_shard_3.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:798f70307ff7f264cb772d377bbd96d3ce0b0380a667eada383e9e8f92670886
+size 33239040
diff --git a/params/params_shard_30.bin b/params/params_shard_30.bin
new file mode 100644
index 0000000000000000000000000000000000000000..592934c697f8915e6cc8b403cc4217c42056a75a
--- /dev/null
+++ b/params/params_shard_30.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5fa3fa67d55ed83f32fa183cebd5026014b178db4b94a8968feee47aa6157922
+size 30474240
diff --git a/params/params_shard_31.bin b/params/params_shard_31.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2749cd333bfbb7138ee079109a9cf3aed21273c8
--- /dev/null
+++ b/params/params_shard_31.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7a29072b0947d2b1451c5649b9f67d5fbdac9d55a098d7682b02af3263179d00
+size 33239040
diff --git a/params/params_shard_32.bin b/params/params_shard_32.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5aa1d9882c7a280dc4f78c5636b3f36fcefe9de0
--- /dev/null
+++ b/params/params_shard_32.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7d764a0fdb9faeb153c1cf25a0e795a87963adf28f2c5ce30b2df5f3a49df8d2
+size 30474240
diff --git a/params/params_shard_33.bin b/params/params_shard_33.bin
new file mode 100644
index 0000000000000000000000000000000000000000..9c7ab8a2944ba0156bf33dfc25c486ee42472faf
--- /dev/null
+++ b/params/params_shard_33.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a06ab40892dde63b328e1d7190bb933fb21cd4392f22f061dc83dfb83154ad3a
+size 33239040
diff --git a/params/params_shard_34.bin b/params/params_shard_34.bin
new file mode 100644
index 0000000000000000000000000000000000000000..d3d0771c91891d53c5c9c41e7d578b4b87b8d6b5
--- /dev/null
+++ b/params/params_shard_34.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:28368c97d8dae349e2ccfdbdbdcfc0bdc4241d1332358f4a7790e9e438254e85
+size 30474240
diff --git a/params/params_shard_35.bin b/params/params_shard_35.bin
new file mode 100644
index 0000000000000000000000000000000000000000..131cf8bf7ac84ef131d1431670805010ba1281a8
--- /dev/null
+++ b/params/params_shard_35.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9816d110a71deed28c3aa457d4cc99a90ba77194d413cc089e7a80a3706f3cd3
+size 33239040
diff --git a/params/params_shard_36.bin b/params/params_shard_36.bin
new file mode 100644
index 0000000000000000000000000000000000000000..8936a8d39a88026ba57b240055c2970bcece2b8d
--- /dev/null
+++ b/params/params_shard_36.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a8da18acfd2d709bb774e291169d9e6bb56ba5acb7698dac5985284ddbd46940
+size 30474240
diff --git a/params/params_shard_37.bin b/params/params_shard_37.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e28b031541feac455257515e064ee6219d4da2f8
--- /dev/null
+++ b/params/params_shard_37.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:30363bdb013d0d9ab1b65172221319421ceecc9851300b516a8d3edb63876fcd
+size 33239040
diff --git a/params/params_shard_38.bin b/params/params_shard_38.bin
new file mode 100644
index 0000000000000000000000000000000000000000..0a3ee860735392444de4b2d2bd046ddbcd28fae9
--- /dev/null
+++ b/params/params_shard_38.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cec2b7d9777cab28f22c81abfdb96e0d9a9909c5ca31aa9b1d313c150eb49409
+size 30474240
diff --git a/params/params_shard_39.bin b/params/params_shard_39.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ebce4683d00c6c971d4e732d5dffff65b2e572a0
--- /dev/null
+++ b/params/params_shard_39.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5af4dbb6b91907a8a50a341fae042f3245b3060ba3021ed9e776e271167c3711
+size 33239040
diff --git a/params/params_shard_4.bin b/params/params_shard_4.bin
new file mode 100644
index 0000000000000000000000000000000000000000..e5347f4c1a3ea8f92747f8bc5d532dc8fe966df3
--- /dev/null
+++ b/params/params_shard_4.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1b64c1fee332205732a44ee123da07ec451c2c2cd630ca7d89bb3c2dda91ae17
+size 30474240
diff --git a/params/params_shard_40.bin b/params/params_shard_40.bin
new file mode 100644
index 0000000000000000000000000000000000000000..2031b38aa5c610992fb21f6e89f83f256ed5a980
--- /dev/null
+++ b/params/params_shard_40.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:df98b68ba04cf44d7dbd6a93eb7e75ed8925d38b3f62ec1be1090a1ba29d28c4
+size 30474240
diff --git a/params/params_shard_41.bin b/params/params_shard_41.bin
new file mode 100644
index 0000000000000000000000000000000000000000..477093a6280366f9b60d0e114558e8dca5b1c3bc
--- /dev/null
+++ b/params/params_shard_41.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b18550de5b27e6f126bdc691e9c52ad6cd7c893e77942cace19d3aeef5f36537
+size 33239040
diff --git a/params/params_shard_42.bin b/params/params_shard_42.bin
new file mode 100644
index 0000000000000000000000000000000000000000..fa063db65aa9ba5e27de5312a7b8643b67f16941
--- /dev/null
+++ b/params/params_shard_42.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5069df66406c3e1eb38aec32b59c0c4c14c078690b925fe7a60eedd8a7802c20
+size 30474240
diff --git a/params/params_shard_43.bin b/params/params_shard_43.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1fff31d567f7508d9e35ee6ea8f47a7dafa69737
--- /dev/null
+++ b/params/params_shard_43.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8022e0f117e0ffe2a57ca3cd5d87357dce8c2bee15edc764ee93e0021bb912fc
+size 33239040
diff --git a/params/params_shard_44.bin b/params/params_shard_44.bin
new file mode 100644
index 0000000000000000000000000000000000000000..c16688593f9c73f720befdabb6e7c34d4cd44b36
--- /dev/null
+++ b/params/params_shard_44.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4681fbd23b376b455b97b6c07fd6f21938be64b31c15590802613ed230a060a8
+size 30474240
diff --git a/params/params_shard_45.bin b/params/params_shard_45.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1c6267450336021617c90a631d5d4017c682aa9b
--- /dev/null
+++ b/params/params_shard_45.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:d205b22e462a0c5fcb99b9d4e7a1b550b4b7d3414ec46f3620ad65b9e25ceab7
+size 33239040
diff --git a/params/params_shard_46.bin b/params/params_shard_46.bin
new file mode 100644
index 0000000000000000000000000000000000000000..099ce7765eeb67f8a578061a5a999202a0071b1d
--- /dev/null
+++ b/params/params_shard_46.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:76393b282df931dc149a5ba719da464ee1e1ef4122043e10b994591270bbd153
+size 30474240
diff --git a/params/params_shard_47.bin b/params/params_shard_47.bin
new file mode 100644
index 0000000000000000000000000000000000000000..ea53645bb30bb2acdd2252499002d803ce7c8ae1
--- /dev/null
+++ b/params/params_shard_47.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:4b23f3e7bac75d7f235434659e76f81afd3737d6709797fa1718928c6ee23cd8
+size 33239040
diff --git a/params/params_shard_48.bin b/params/params_shard_48.bin
new file mode 100644
index 0000000000000000000000000000000000000000..78f5e2ec91edc87dbf85cffa89aea52b71a8ea2f
--- /dev/null
+++ b/params/params_shard_48.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5d03a2d01dccc152fcecb06f8c92111828caac38993cd0723072f5ca6633a310
+size 30474240
diff --git a/params/params_shard_49.bin b/params/params_shard_49.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7964ab08d63681b58041815ed8ff6c930eb4692f
--- /dev/null
+++ b/params/params_shard_49.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:f3631b7c8e5315c1e95e6bf02b7e309b5d7329d7c9c73d0272242d7505c2f132
+size 75595776
diff --git a/params/params_shard_5.bin b/params/params_shard_5.bin
new file mode 100644
index 0000000000000000000000000000000000000000..cf5c7aea82db98db5eec92f2542a0c5c8ed1dd26
--- /dev/null
+++ b/params/params_shard_5.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:a78fb69b60da961d9d9e50659d9265280db05254e981927ff17967b52551ea45
+size 33239040
diff --git a/params/params_shard_50.bin b/params/params_shard_50.bin
new file mode 100644
index 0000000000000000000000000000000000000000..4184bc7896e1e1d9f821d8db4896415fe30189f2
--- /dev/null
+++ b/params/params_shard_50.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:af9f4b114e16e0ba8fa099b0889887cfc6bfa60a1c2e1894781624e32caac525
+size 27817984
diff --git a/params/params_shard_6.bin b/params/params_shard_6.bin
new file mode 100644
index 0000000000000000000000000000000000000000..7dd9359f29221a0a90532efd31461489abb586cc
--- /dev/null
+++ b/params/params_shard_6.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:359c7702b6fb0cbbc0660fe1c59a91ac5861da8473f5a66b31ed10b8816ed7d0
+size 30474240
diff --git a/params/params_shard_7.bin b/params/params_shard_7.bin
new file mode 100644
index 0000000000000000000000000000000000000000..95ffb84f06aa3ffbb7a5197c0163e133deff8d87
--- /dev/null
+++ b/params/params_shard_7.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:1e73af4995bc5183b2701e827400d637d5a0662633fcfeda23a326e0ee2cf647
+size 33239040
diff --git a/params/params_shard_8.bin b/params/params_shard_8.bin
new file mode 100644
index 0000000000000000000000000000000000000000..1be3d03ed258a8a22163d873d9bf21dc038c016b
--- /dev/null
+++ b/params/params_shard_8.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:510bd24e72c9fa5defdaede0f725ded1f1d06cb5aeff4bb8505f7083117c793a
+size 30474240
diff --git a/params/params_shard_9.bin b/params/params_shard_9.bin
new file mode 100644
index 0000000000000000000000000000000000000000..5dd1547fe75d483af016b20ee8a52b42145052a8
--- /dev/null
+++ b/params/params_shard_9.bin
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:eacd5601d1ea7d7c4231907a00803ff5a076f65e4a29cb60368c1b74742e3f5b
+size 33239040
diff --git a/params/tokenizer.model b/params/tokenizer.model
new file mode 100644
index 0000000000000000000000000000000000000000..14cb1e69f41eba3bba66ff8215b1de01e273f42b
--- /dev/null
+++ b/params/tokenizer.model
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ae87c0db2b21b0fa3fdc5e19d1f9cea94efb703cc7c6281d8718a6714b3cc2be
+size 748869
diff --git a/params/tokenizer_config.json b/params/tokenizer_config.json
new file mode 100644
index 0000000000000000000000000000000000000000..c55a3f9810e9f356a7c3d6b3fcd68f6af98357c9
--- /dev/null
+++ b/params/tokenizer_config.json
@@ -0,0 +1,37 @@
+{
+ "add_bos_token": true,
+ "add_eos_token": false,
+ "bos_token": {
+ "__type": "AddedToken",
+ "content": "<s>",
+ "lstrip": false,
+ "normalized": true,
+ "rstrip": false,
+ "single_word": false
+ },
+ "clean_up_tokenization_spaces": false,
+ "eos_token": {
+ "__type": "AddedToken",
+ "content": "</s>",
+ "lstrip": false,
+ "normalized": true,
+ "rstrip": false,
+ "single_word": false
+ },
+ "legacy": null,
+ "model_max_length": 1000000000000000019884624838656,
+ "pad_token": null,
+ "sp_model_kwargs": {},
+ "spaces_between_special_tokens": false,
+ "tokenizer_class": "LlamaTokenizer",
+ "unk_token": {
+ "__type": "AddedToken",
+ "content": "<unk>",
+ "lstrip": false,
+ "normalized": true,
+ "rstrip": false,
+ "single_word": false
+ },
+ "use_default_system_prompt": true,
+ "use_fast": true
+}