lrsoft committed on
Commit
6002451
·
1 Parent(s): 24d9b94

Add model files

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +3 -0
  2. MiniChat-1.5-3B-q4f16_1-vulkan.dll +3 -0
  3. MiniChat-1.5-3B-q4f16_1-vulkan.exp +0 -0
  4. MiniChat-1.5-3B-q4f16_1-vulkan.lib +3 -0
  5. params/mlc-chat-config.json +21 -0
  6. params/ndarray-cache.json +3083 -0
  7. params/params_shard_0.bin +3 -0
  8. params/params_shard_1.bin +3 -0
  9. params/params_shard_10.bin +3 -0
  10. params/params_shard_11.bin +3 -0
  11. params/params_shard_12.bin +3 -0
  12. params/params_shard_13.bin +3 -0
  13. params/params_shard_14.bin +3 -0
  14. params/params_shard_15.bin +3 -0
  15. params/params_shard_16.bin +3 -0
  16. params/params_shard_17.bin +3 -0
  17. params/params_shard_18.bin +3 -0
  18. params/params_shard_19.bin +3 -0
  19. params/params_shard_2.bin +3 -0
  20. params/params_shard_20.bin +3 -0
  21. params/params_shard_21.bin +3 -0
  22. params/params_shard_22.bin +3 -0
  23. params/params_shard_23.bin +3 -0
  24. params/params_shard_24.bin +3 -0
  25. params/params_shard_25.bin +3 -0
  26. params/params_shard_26.bin +3 -0
  27. params/params_shard_27.bin +3 -0
  28. params/params_shard_28.bin +3 -0
  29. params/params_shard_29.bin +3 -0
  30. params/params_shard_3.bin +3 -0
  31. params/params_shard_30.bin +3 -0
  32. params/params_shard_31.bin +3 -0
  33. params/params_shard_32.bin +3 -0
  34. params/params_shard_33.bin +3 -0
  35. params/params_shard_34.bin +3 -0
  36. params/params_shard_35.bin +3 -0
  37. params/params_shard_36.bin +3 -0
  38. params/params_shard_37.bin +3 -0
  39. params/params_shard_38.bin +3 -0
  40. params/params_shard_39.bin +3 -0
  41. params/params_shard_4.bin +3 -0
  42. params/params_shard_40.bin +3 -0
  43. params/params_shard_41.bin +3 -0
  44. params/params_shard_42.bin +3 -0
  45. params/params_shard_43.bin +3 -0
  46. params/params_shard_44.bin +3 -0
  47. params/params_shard_45.bin +3 -0
  48. params/params_shard_46.bin +3 -0
  49. params/params_shard_47.bin +3 -0
  50. params/params_shard_48.bin +3 -0
.gitattributes CHANGED
@@ -33,3 +33,6 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ *.so filter=lfs diff=lfs merge=lfs -text
37
+ *.dll filter=lfs diff=lfs merge=lfs -text
38
+ *.lib filter=lfs diff=lfs merge=lfs -text
MiniChat-1.5-3B-q4f16_1-vulkan.dll ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be81332f4249e7fcc4fff237d988064112d77280f06a6ced02a35232c932d90c
3
+ size 26675712
MiniChat-1.5-3B-q4f16_1-vulkan.exp ADDED
Binary file (7.37 kB). View file
 
MiniChat-1.5-3B-q4f16_1-vulkan.lib ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ea706f1d92d34e752c22794cde07923436f6c807ac8cd1bdb0136d44b842245
3
+ size 14110
params/mlc-chat-config.json ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_lib": "MiniChat-1.5-3B-q4f16_1",
3
+ "local_id": "MiniChat-1.5-3B-q4f16_1",
4
+ "conv_template": "llama_default",
5
+ "temperature": 0.7,
6
+ "repetition_penalty": 1.0,
7
+ "top_p": 0.95,
8
+ "mean_gen_len": 128,
9
+ "max_gen_len": 4096,
10
+ "num_shards": 1,
11
+ "use_presharded_weights": false,
12
+ "shift_fill_factor": 0.3,
13
+ "tokenizer_files": [
14
+ "tokenizer.model"
15
+ ],
16
+ "model_category": "llama",
17
+ "model_name": "MiniChat-1.5-3B",
18
+ "vocab_size": 49216,
19
+ "prefill_chunk_size": -1,
20
+ "max_window_size": 4096
21
+ }
params/ndarray-cache.json ADDED
@@ -0,0 +1,3083 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "metadata": {
3
+ "ParamSize": 247
4
+ },
5
+ "records": [
6
+ {
7
+ "dataPath": "params_shard_0.bin",
8
+ "format": "raw-shard",
9
+ "nbytes": 75595776,
10
+ "records": [
11
+ {
12
+ "name": "param_0",
13
+ "shape": [
14
+ 49216,
15
+ 384
16
+ ],
17
+ "dtype": "uint32",
18
+ "format": "raw",
19
+ "nbytes": 75595776,
20
+ "byteOffset": 0
21
+ }
22
+ ],
23
+ "md5sum": "ecf15d3f0901ab7456e8e0af8ced507c"
24
+ },
25
+ {
26
+ "dataPath": "params_shard_1.bin",
27
+ "format": "raw-shard",
28
+ "nbytes": 25165824,
29
+ "records": [
30
+ {
31
+ "name": "param_6",
32
+ "shape": [
33
+ 16384,
34
+ 384
35
+ ],
36
+ "dtype": "uint32",
37
+ "format": "raw",
38
+ "nbytes": 25165824,
39
+ "byteOffset": 0
40
+ }
41
+ ],
42
+ "md5sum": "9bbebd6e9fb88198483ac084144d55a6"
43
+ },
44
+ {
45
+ "dataPath": "params_shard_2.bin",
46
+ "format": "raw-shard",
47
+ "nbytes": 30683136,
48
+ "records": [
49
+ {
50
+ "name": "param_1",
51
+ "shape": [
52
+ 49216,
53
+ 96
54
+ ],
55
+ "dtype": "float16",
56
+ "format": "raw",
57
+ "nbytes": 9449472,
58
+ "byteOffset": 0
59
+ },
60
+ {
61
+ "name": "param_2",
62
+ "shape": [
63
+ 9216,
64
+ 384
65
+ ],
66
+ "dtype": "uint32",
67
+ "format": "raw",
68
+ "nbytes": 14155776,
69
+ "byteOffset": 9449472
70
+ },
71
+ {
72
+ "name": "param_3",
73
+ "shape": [
74
+ 9216,
75
+ 96
76
+ ],
77
+ "dtype": "float16",
78
+ "format": "raw",
79
+ "nbytes": 1769472,
80
+ "byteOffset": 23605248
81
+ },
82
+ {
83
+ "name": "param_4",
84
+ "shape": [
85
+ 3072,
86
+ 384
87
+ ],
88
+ "dtype": "uint32",
89
+ "format": "raw",
90
+ "nbytes": 4718592,
91
+ "byteOffset": 25374720
92
+ },
93
+ {
94
+ "name": "param_5",
95
+ "shape": [
96
+ 3072,
97
+ 96
98
+ ],
99
+ "dtype": "float16",
100
+ "format": "raw",
101
+ "nbytes": 589824,
102
+ "byteOffset": 30093312
103
+ }
104
+ ],
105
+ "md5sum": "2e5970708026d9b687364767425202cb"
106
+ },
107
+ {
108
+ "dataPath": "params_shard_3.bin",
109
+ "format": "raw-shard",
110
+ "nbytes": 33239040,
111
+ "records": [
112
+ {
113
+ "name": "param_7",
114
+ "shape": [
115
+ 16384,
116
+ 96
117
+ ],
118
+ "dtype": "float16",
119
+ "format": "raw",
120
+ "nbytes": 3145728,
121
+ "byteOffset": 0
122
+ },
123
+ {
124
+ "name": "param_8",
125
+ "shape": [
126
+ 3072,
127
+ 1024
128
+ ],
129
+ "dtype": "uint32",
130
+ "format": "raw",
131
+ "nbytes": 12582912,
132
+ "byteOffset": 3145728
133
+ },
134
+ {
135
+ "name": "param_9",
136
+ "shape": [
137
+ 3072,
138
+ 256
139
+ ],
140
+ "dtype": "float16",
141
+ "format": "raw",
142
+ "nbytes": 1572864,
143
+ "byteOffset": 15728640
144
+ },
145
+ {
146
+ "name": "param_10",
147
+ "shape": [
148
+ 3072
149
+ ],
150
+ "dtype": "float16",
151
+ "format": "raw",
152
+ "nbytes": 6144,
153
+ "byteOffset": 17301504
154
+ },
155
+ {
156
+ "name": "param_11",
157
+ "shape": [
158
+ 3072
159
+ ],
160
+ "dtype": "float16",
161
+ "format": "raw",
162
+ "nbytes": 6144,
163
+ "byteOffset": 17307648
164
+ },
165
+ {
166
+ "name": "param_12",
167
+ "shape": [
168
+ 9216,
169
+ 384
170
+ ],
171
+ "dtype": "uint32",
172
+ "format": "raw",
173
+ "nbytes": 14155776,
174
+ "byteOffset": 17313792
175
+ },
176
+ {
177
+ "name": "param_13",
178
+ "shape": [
179
+ 9216,
180
+ 96
181
+ ],
182
+ "dtype": "float16",
183
+ "format": "raw",
184
+ "nbytes": 1769472,
185
+ "byteOffset": 31469568
186
+ }
187
+ ],
188
+ "md5sum": "9f934199d76c5d26646f3d545ab72fff"
189
+ },
190
+ {
191
+ "dataPath": "params_shard_4.bin",
192
+ "format": "raw-shard",
193
+ "nbytes": 30474240,
194
+ "records": [
195
+ {
196
+ "name": "param_14",
197
+ "shape": [
198
+ 3072,
199
+ 384
200
+ ],
201
+ "dtype": "uint32",
202
+ "format": "raw",
203
+ "nbytes": 4718592,
204
+ "byteOffset": 0
205
+ },
206
+ {
207
+ "name": "param_15",
208
+ "shape": [
209
+ 3072,
210
+ 96
211
+ ],
212
+ "dtype": "float16",
213
+ "format": "raw",
214
+ "nbytes": 589824,
215
+ "byteOffset": 4718592
216
+ },
217
+ {
218
+ "name": "param_16",
219
+ "shape": [
220
+ 16384,
221
+ 384
222
+ ],
223
+ "dtype": "uint32",
224
+ "format": "raw",
225
+ "nbytes": 25165824,
226
+ "byteOffset": 5308416
227
+ }
228
+ ],
229
+ "md5sum": "a3cb6df79e4429abc2be010fedfc51d1"
230
+ },
231
+ {
232
+ "dataPath": "params_shard_5.bin",
233
+ "format": "raw-shard",
234
+ "nbytes": 33239040,
235
+ "records": [
236
+ {
237
+ "name": "param_17",
238
+ "shape": [
239
+ 16384,
240
+ 96
241
+ ],
242
+ "dtype": "float16",
243
+ "format": "raw",
244
+ "nbytes": 3145728,
245
+ "byteOffset": 0
246
+ },
247
+ {
248
+ "name": "param_18",
249
+ "shape": [
250
+ 3072,
251
+ 1024
252
+ ],
253
+ "dtype": "uint32",
254
+ "format": "raw",
255
+ "nbytes": 12582912,
256
+ "byteOffset": 3145728
257
+ },
258
+ {
259
+ "name": "param_19",
260
+ "shape": [
261
+ 3072,
262
+ 256
263
+ ],
264
+ "dtype": "float16",
265
+ "format": "raw",
266
+ "nbytes": 1572864,
267
+ "byteOffset": 15728640
268
+ },
269
+ {
270
+ "name": "param_20",
271
+ "shape": [
272
+ 3072
273
+ ],
274
+ "dtype": "float16",
275
+ "format": "raw",
276
+ "nbytes": 6144,
277
+ "byteOffset": 17301504
278
+ },
279
+ {
280
+ "name": "param_21",
281
+ "shape": [
282
+ 3072
283
+ ],
284
+ "dtype": "float16",
285
+ "format": "raw",
286
+ "nbytes": 6144,
287
+ "byteOffset": 17307648
288
+ },
289
+ {
290
+ "name": "param_22",
291
+ "shape": [
292
+ 9216,
293
+ 384
294
+ ],
295
+ "dtype": "uint32",
296
+ "format": "raw",
297
+ "nbytes": 14155776,
298
+ "byteOffset": 17313792
299
+ },
300
+ {
301
+ "name": "param_23",
302
+ "shape": [
303
+ 9216,
304
+ 96
305
+ ],
306
+ "dtype": "float16",
307
+ "format": "raw",
308
+ "nbytes": 1769472,
309
+ "byteOffset": 31469568
310
+ }
311
+ ],
312
+ "md5sum": "abf83c3c7e851bb5767f197da8cb1dac"
313
+ },
314
+ {
315
+ "dataPath": "params_shard_6.bin",
316
+ "format": "raw-shard",
317
+ "nbytes": 30474240,
318
+ "records": [
319
+ {
320
+ "name": "param_24",
321
+ "shape": [
322
+ 3072,
323
+ 384
324
+ ],
325
+ "dtype": "uint32",
326
+ "format": "raw",
327
+ "nbytes": 4718592,
328
+ "byteOffset": 0
329
+ },
330
+ {
331
+ "name": "param_25",
332
+ "shape": [
333
+ 3072,
334
+ 96
335
+ ],
336
+ "dtype": "float16",
337
+ "format": "raw",
338
+ "nbytes": 589824,
339
+ "byteOffset": 4718592
340
+ },
341
+ {
342
+ "name": "param_26",
343
+ "shape": [
344
+ 16384,
345
+ 384
346
+ ],
347
+ "dtype": "uint32",
348
+ "format": "raw",
349
+ "nbytes": 25165824,
350
+ "byteOffset": 5308416
351
+ }
352
+ ],
353
+ "md5sum": "6ce898064ed0861322bbf62e9d70d729"
354
+ },
355
+ {
356
+ "dataPath": "params_shard_7.bin",
357
+ "format": "raw-shard",
358
+ "nbytes": 33239040,
359
+ "records": [
360
+ {
361
+ "name": "param_27",
362
+ "shape": [
363
+ 16384,
364
+ 96
365
+ ],
366
+ "dtype": "float16",
367
+ "format": "raw",
368
+ "nbytes": 3145728,
369
+ "byteOffset": 0
370
+ },
371
+ {
372
+ "name": "param_28",
373
+ "shape": [
374
+ 3072,
375
+ 1024
376
+ ],
377
+ "dtype": "uint32",
378
+ "format": "raw",
379
+ "nbytes": 12582912,
380
+ "byteOffset": 3145728
381
+ },
382
+ {
383
+ "name": "param_29",
384
+ "shape": [
385
+ 3072,
386
+ 256
387
+ ],
388
+ "dtype": "float16",
389
+ "format": "raw",
390
+ "nbytes": 1572864,
391
+ "byteOffset": 15728640
392
+ },
393
+ {
394
+ "name": "param_30",
395
+ "shape": [
396
+ 3072
397
+ ],
398
+ "dtype": "float16",
399
+ "format": "raw",
400
+ "nbytes": 6144,
401
+ "byteOffset": 17301504
402
+ },
403
+ {
404
+ "name": "param_31",
405
+ "shape": [
406
+ 3072
407
+ ],
408
+ "dtype": "float16",
409
+ "format": "raw",
410
+ "nbytes": 6144,
411
+ "byteOffset": 17307648
412
+ },
413
+ {
414
+ "name": "param_32",
415
+ "shape": [
416
+ 9216,
417
+ 384
418
+ ],
419
+ "dtype": "uint32",
420
+ "format": "raw",
421
+ "nbytes": 14155776,
422
+ "byteOffset": 17313792
423
+ },
424
+ {
425
+ "name": "param_33",
426
+ "shape": [
427
+ 9216,
428
+ 96
429
+ ],
430
+ "dtype": "float16",
431
+ "format": "raw",
432
+ "nbytes": 1769472,
433
+ "byteOffset": 31469568
434
+ }
435
+ ],
436
+ "md5sum": "172bd66af74d0e34491ae5bb801be91a"
437
+ },
438
+ {
439
+ "dataPath": "params_shard_8.bin",
440
+ "format": "raw-shard",
441
+ "nbytes": 30474240,
442
+ "records": [
443
+ {
444
+ "name": "param_34",
445
+ "shape": [
446
+ 3072,
447
+ 384
448
+ ],
449
+ "dtype": "uint32",
450
+ "format": "raw",
451
+ "nbytes": 4718592,
452
+ "byteOffset": 0
453
+ },
454
+ {
455
+ "name": "param_35",
456
+ "shape": [
457
+ 3072,
458
+ 96
459
+ ],
460
+ "dtype": "float16",
461
+ "format": "raw",
462
+ "nbytes": 589824,
463
+ "byteOffset": 4718592
464
+ },
465
+ {
466
+ "name": "param_36",
467
+ "shape": [
468
+ 16384,
469
+ 384
470
+ ],
471
+ "dtype": "uint32",
472
+ "format": "raw",
473
+ "nbytes": 25165824,
474
+ "byteOffset": 5308416
475
+ }
476
+ ],
477
+ "md5sum": "80622e63178dc3e00ced75b53b23fd35"
478
+ },
479
+ {
480
+ "dataPath": "params_shard_9.bin",
481
+ "format": "raw-shard",
482
+ "nbytes": 33239040,
483
+ "records": [
484
+ {
485
+ "name": "param_37",
486
+ "shape": [
487
+ 16384,
488
+ 96
489
+ ],
490
+ "dtype": "float16",
491
+ "format": "raw",
492
+ "nbytes": 3145728,
493
+ "byteOffset": 0
494
+ },
495
+ {
496
+ "name": "param_38",
497
+ "shape": [
498
+ 3072,
499
+ 1024
500
+ ],
501
+ "dtype": "uint32",
502
+ "format": "raw",
503
+ "nbytes": 12582912,
504
+ "byteOffset": 3145728
505
+ },
506
+ {
507
+ "name": "param_39",
508
+ "shape": [
509
+ 3072,
510
+ 256
511
+ ],
512
+ "dtype": "float16",
513
+ "format": "raw",
514
+ "nbytes": 1572864,
515
+ "byteOffset": 15728640
516
+ },
517
+ {
518
+ "name": "param_40",
519
+ "shape": [
520
+ 3072
521
+ ],
522
+ "dtype": "float16",
523
+ "format": "raw",
524
+ "nbytes": 6144,
525
+ "byteOffset": 17301504
526
+ },
527
+ {
528
+ "name": "param_41",
529
+ "shape": [
530
+ 3072
531
+ ],
532
+ "dtype": "float16",
533
+ "format": "raw",
534
+ "nbytes": 6144,
535
+ "byteOffset": 17307648
536
+ },
537
+ {
538
+ "name": "param_42",
539
+ "shape": [
540
+ 9216,
541
+ 384
542
+ ],
543
+ "dtype": "uint32",
544
+ "format": "raw",
545
+ "nbytes": 14155776,
546
+ "byteOffset": 17313792
547
+ },
548
+ {
549
+ "name": "param_43",
550
+ "shape": [
551
+ 9216,
552
+ 96
553
+ ],
554
+ "dtype": "float16",
555
+ "format": "raw",
556
+ "nbytes": 1769472,
557
+ "byteOffset": 31469568
558
+ }
559
+ ],
560
+ "md5sum": "1b105ec9d866d775cb69379c40757f88"
561
+ },
562
+ {
563
+ "dataPath": "params_shard_10.bin",
564
+ "format": "raw-shard",
565
+ "nbytes": 30474240,
566
+ "records": [
567
+ {
568
+ "name": "param_44",
569
+ "shape": [
570
+ 3072,
571
+ 384
572
+ ],
573
+ "dtype": "uint32",
574
+ "format": "raw",
575
+ "nbytes": 4718592,
576
+ "byteOffset": 0
577
+ },
578
+ {
579
+ "name": "param_45",
580
+ "shape": [
581
+ 3072,
582
+ 96
583
+ ],
584
+ "dtype": "float16",
585
+ "format": "raw",
586
+ "nbytes": 589824,
587
+ "byteOffset": 4718592
588
+ },
589
+ {
590
+ "name": "param_46",
591
+ "shape": [
592
+ 16384,
593
+ 384
594
+ ],
595
+ "dtype": "uint32",
596
+ "format": "raw",
597
+ "nbytes": 25165824,
598
+ "byteOffset": 5308416
599
+ }
600
+ ],
601
+ "md5sum": "8ca5fd22e33b7ecfc4edb22c2429bea0"
602
+ },
603
+ {
604
+ "dataPath": "params_shard_11.bin",
605
+ "format": "raw-shard",
606
+ "nbytes": 33239040,
607
+ "records": [
608
+ {
609
+ "name": "param_47",
610
+ "shape": [
611
+ 16384,
612
+ 96
613
+ ],
614
+ "dtype": "float16",
615
+ "format": "raw",
616
+ "nbytes": 3145728,
617
+ "byteOffset": 0
618
+ },
619
+ {
620
+ "name": "param_48",
621
+ "shape": [
622
+ 3072,
623
+ 1024
624
+ ],
625
+ "dtype": "uint32",
626
+ "format": "raw",
627
+ "nbytes": 12582912,
628
+ "byteOffset": 3145728
629
+ },
630
+ {
631
+ "name": "param_49",
632
+ "shape": [
633
+ 3072,
634
+ 256
635
+ ],
636
+ "dtype": "float16",
637
+ "format": "raw",
638
+ "nbytes": 1572864,
639
+ "byteOffset": 15728640
640
+ },
641
+ {
642
+ "name": "param_50",
643
+ "shape": [
644
+ 3072
645
+ ],
646
+ "dtype": "float16",
647
+ "format": "raw",
648
+ "nbytes": 6144,
649
+ "byteOffset": 17301504
650
+ },
651
+ {
652
+ "name": "param_51",
653
+ "shape": [
654
+ 3072
655
+ ],
656
+ "dtype": "float16",
657
+ "format": "raw",
658
+ "nbytes": 6144,
659
+ "byteOffset": 17307648
660
+ },
661
+ {
662
+ "name": "param_52",
663
+ "shape": [
664
+ 9216,
665
+ 384
666
+ ],
667
+ "dtype": "uint32",
668
+ "format": "raw",
669
+ "nbytes": 14155776,
670
+ "byteOffset": 17313792
671
+ },
672
+ {
673
+ "name": "param_53",
674
+ "shape": [
675
+ 9216,
676
+ 96
677
+ ],
678
+ "dtype": "float16",
679
+ "format": "raw",
680
+ "nbytes": 1769472,
681
+ "byteOffset": 31469568
682
+ }
683
+ ],
684
+ "md5sum": "33dbf522d5e71a2c9c80bba1cd630861"
685
+ },
686
+ {
687
+ "dataPath": "params_shard_12.bin",
688
+ "format": "raw-shard",
689
+ "nbytes": 30474240,
690
+ "records": [
691
+ {
692
+ "name": "param_54",
693
+ "shape": [
694
+ 3072,
695
+ 384
696
+ ],
697
+ "dtype": "uint32",
698
+ "format": "raw",
699
+ "nbytes": 4718592,
700
+ "byteOffset": 0
701
+ },
702
+ {
703
+ "name": "param_55",
704
+ "shape": [
705
+ 3072,
706
+ 96
707
+ ],
708
+ "dtype": "float16",
709
+ "format": "raw",
710
+ "nbytes": 589824,
711
+ "byteOffset": 4718592
712
+ },
713
+ {
714
+ "name": "param_56",
715
+ "shape": [
716
+ 16384,
717
+ 384
718
+ ],
719
+ "dtype": "uint32",
720
+ "format": "raw",
721
+ "nbytes": 25165824,
722
+ "byteOffset": 5308416
723
+ }
724
+ ],
725
+ "md5sum": "ffc57c8bae42beb9ca8bd2f58a9e4b90"
726
+ },
727
+ {
728
+ "dataPath": "params_shard_13.bin",
729
+ "format": "raw-shard",
730
+ "nbytes": 33239040,
731
+ "records": [
732
+ {
733
+ "name": "param_57",
734
+ "shape": [
735
+ 16384,
736
+ 96
737
+ ],
738
+ "dtype": "float16",
739
+ "format": "raw",
740
+ "nbytes": 3145728,
741
+ "byteOffset": 0
742
+ },
743
+ {
744
+ "name": "param_58",
745
+ "shape": [
746
+ 3072,
747
+ 1024
748
+ ],
749
+ "dtype": "uint32",
750
+ "format": "raw",
751
+ "nbytes": 12582912,
752
+ "byteOffset": 3145728
753
+ },
754
+ {
755
+ "name": "param_59",
756
+ "shape": [
757
+ 3072,
758
+ 256
759
+ ],
760
+ "dtype": "float16",
761
+ "format": "raw",
762
+ "nbytes": 1572864,
763
+ "byteOffset": 15728640
764
+ },
765
+ {
766
+ "name": "param_60",
767
+ "shape": [
768
+ 3072
769
+ ],
770
+ "dtype": "float16",
771
+ "format": "raw",
772
+ "nbytes": 6144,
773
+ "byteOffset": 17301504
774
+ },
775
+ {
776
+ "name": "param_61",
777
+ "shape": [
778
+ 3072
779
+ ],
780
+ "dtype": "float16",
781
+ "format": "raw",
782
+ "nbytes": 6144,
783
+ "byteOffset": 17307648
784
+ },
785
+ {
786
+ "name": "param_62",
787
+ "shape": [
788
+ 9216,
789
+ 384
790
+ ],
791
+ "dtype": "uint32",
792
+ "format": "raw",
793
+ "nbytes": 14155776,
794
+ "byteOffset": 17313792
795
+ },
796
+ {
797
+ "name": "param_63",
798
+ "shape": [
799
+ 9216,
800
+ 96
801
+ ],
802
+ "dtype": "float16",
803
+ "format": "raw",
804
+ "nbytes": 1769472,
805
+ "byteOffset": 31469568
806
+ }
807
+ ],
808
+ "md5sum": "7000c9ae4c55bccc6d8d4ff1cbfd6543"
809
+ },
810
+ {
811
+ "dataPath": "params_shard_14.bin",
812
+ "format": "raw-shard",
813
+ "nbytes": 30474240,
814
+ "records": [
815
+ {
816
+ "name": "param_64",
817
+ "shape": [
818
+ 3072,
819
+ 384
820
+ ],
821
+ "dtype": "uint32",
822
+ "format": "raw",
823
+ "nbytes": 4718592,
824
+ "byteOffset": 0
825
+ },
826
+ {
827
+ "name": "param_65",
828
+ "shape": [
829
+ 3072,
830
+ 96
831
+ ],
832
+ "dtype": "float16",
833
+ "format": "raw",
834
+ "nbytes": 589824,
835
+ "byteOffset": 4718592
836
+ },
837
+ {
838
+ "name": "param_66",
839
+ "shape": [
840
+ 16384,
841
+ 384
842
+ ],
843
+ "dtype": "uint32",
844
+ "format": "raw",
845
+ "nbytes": 25165824,
846
+ "byteOffset": 5308416
847
+ }
848
+ ],
849
+ "md5sum": "948f3bbf1c76842dde7f1b9831212144"
850
+ },
851
+ {
852
+ "dataPath": "params_shard_15.bin",
853
+ "format": "raw-shard",
854
+ "nbytes": 33239040,
855
+ "records": [
856
+ {
857
+ "name": "param_67",
858
+ "shape": [
859
+ 16384,
860
+ 96
861
+ ],
862
+ "dtype": "float16",
863
+ "format": "raw",
864
+ "nbytes": 3145728,
865
+ "byteOffset": 0
866
+ },
867
+ {
868
+ "name": "param_68",
869
+ "shape": [
870
+ 3072,
871
+ 1024
872
+ ],
873
+ "dtype": "uint32",
874
+ "format": "raw",
875
+ "nbytes": 12582912,
876
+ "byteOffset": 3145728
877
+ },
878
+ {
879
+ "name": "param_69",
880
+ "shape": [
881
+ 3072,
882
+ 256
883
+ ],
884
+ "dtype": "float16",
885
+ "format": "raw",
886
+ "nbytes": 1572864,
887
+ "byteOffset": 15728640
888
+ },
889
+ {
890
+ "name": "param_70",
891
+ "shape": [
892
+ 3072
893
+ ],
894
+ "dtype": "float16",
895
+ "format": "raw",
896
+ "nbytes": 6144,
897
+ "byteOffset": 17301504
898
+ },
899
+ {
900
+ "name": "param_71",
901
+ "shape": [
902
+ 3072
903
+ ],
904
+ "dtype": "float16",
905
+ "format": "raw",
906
+ "nbytes": 6144,
907
+ "byteOffset": 17307648
908
+ },
909
+ {
910
+ "name": "param_72",
911
+ "shape": [
912
+ 9216,
913
+ 384
914
+ ],
915
+ "dtype": "uint32",
916
+ "format": "raw",
917
+ "nbytes": 14155776,
918
+ "byteOffset": 17313792
919
+ },
920
+ {
921
+ "name": "param_73",
922
+ "shape": [
923
+ 9216,
924
+ 96
925
+ ],
926
+ "dtype": "float16",
927
+ "format": "raw",
928
+ "nbytes": 1769472,
929
+ "byteOffset": 31469568
930
+ }
931
+ ],
932
+ "md5sum": "32bec1a6997ffbfd0ab9e93f56b9ad87"
933
+ },
934
+ {
935
+ "dataPath": "params_shard_16.bin",
936
+ "format": "raw-shard",
937
+ "nbytes": 30474240,
938
+ "records": [
939
+ {
940
+ "name": "param_74",
941
+ "shape": [
942
+ 3072,
943
+ 384
944
+ ],
945
+ "dtype": "uint32",
946
+ "format": "raw",
947
+ "nbytes": 4718592,
948
+ "byteOffset": 0
949
+ },
950
+ {
951
+ "name": "param_75",
952
+ "shape": [
953
+ 3072,
954
+ 96
955
+ ],
956
+ "dtype": "float16",
957
+ "format": "raw",
958
+ "nbytes": 589824,
959
+ "byteOffset": 4718592
960
+ },
961
+ {
962
+ "name": "param_76",
963
+ "shape": [
964
+ 16384,
965
+ 384
966
+ ],
967
+ "dtype": "uint32",
968
+ "format": "raw",
969
+ "nbytes": 25165824,
970
+ "byteOffset": 5308416
971
+ }
972
+ ],
973
+ "md5sum": "8711c6302582fddaa4c9e7ed91a75c7b"
974
+ },
975
+ {
976
+ "dataPath": "params_shard_17.bin",
977
+ "format": "raw-shard",
978
+ "nbytes": 33239040,
979
+ "records": [
980
+ {
981
+ "name": "param_77",
982
+ "shape": [
983
+ 16384,
984
+ 96
985
+ ],
986
+ "dtype": "float16",
987
+ "format": "raw",
988
+ "nbytes": 3145728,
989
+ "byteOffset": 0
990
+ },
991
+ {
992
+ "name": "param_78",
993
+ "shape": [
994
+ 3072,
995
+ 1024
996
+ ],
997
+ "dtype": "uint32",
998
+ "format": "raw",
999
+ "nbytes": 12582912,
1000
+ "byteOffset": 3145728
1001
+ },
1002
+ {
1003
+ "name": "param_79",
1004
+ "shape": [
1005
+ 3072,
1006
+ 256
1007
+ ],
1008
+ "dtype": "float16",
1009
+ "format": "raw",
1010
+ "nbytes": 1572864,
1011
+ "byteOffset": 15728640
1012
+ },
1013
+ {
1014
+ "name": "param_80",
1015
+ "shape": [
1016
+ 3072
1017
+ ],
1018
+ "dtype": "float16",
1019
+ "format": "raw",
1020
+ "nbytes": 6144,
1021
+ "byteOffset": 17301504
1022
+ },
1023
+ {
1024
+ "name": "param_81",
1025
+ "shape": [
1026
+ 3072
1027
+ ],
1028
+ "dtype": "float16",
1029
+ "format": "raw",
1030
+ "nbytes": 6144,
1031
+ "byteOffset": 17307648
1032
+ },
1033
+ {
1034
+ "name": "param_82",
1035
+ "shape": [
1036
+ 9216,
1037
+ 384
1038
+ ],
1039
+ "dtype": "uint32",
1040
+ "format": "raw",
1041
+ "nbytes": 14155776,
1042
+ "byteOffset": 17313792
1043
+ },
1044
+ {
1045
+ "name": "param_83",
1046
+ "shape": [
1047
+ 9216,
1048
+ 96
1049
+ ],
1050
+ "dtype": "float16",
1051
+ "format": "raw",
1052
+ "nbytes": 1769472,
1053
+ "byteOffset": 31469568
1054
+ }
1055
+ ],
1056
+ "md5sum": "29147a956d8177b8d4b5c57754a7d670"
1057
+ },
1058
+ {
1059
+ "dataPath": "params_shard_18.bin",
1060
+ "format": "raw-shard",
1061
+ "nbytes": 30474240,
1062
+ "records": [
1063
+ {
1064
+ "name": "param_84",
1065
+ "shape": [
1066
+ 3072,
1067
+ 384
1068
+ ],
1069
+ "dtype": "uint32",
1070
+ "format": "raw",
1071
+ "nbytes": 4718592,
1072
+ "byteOffset": 0
1073
+ },
1074
+ {
1075
+ "name": "param_85",
1076
+ "shape": [
1077
+ 3072,
1078
+ 96
1079
+ ],
1080
+ "dtype": "float16",
1081
+ "format": "raw",
1082
+ "nbytes": 589824,
1083
+ "byteOffset": 4718592
1084
+ },
1085
+ {
1086
+ "name": "param_86",
1087
+ "shape": [
1088
+ 16384,
1089
+ 384
1090
+ ],
1091
+ "dtype": "uint32",
1092
+ "format": "raw",
1093
+ "nbytes": 25165824,
1094
+ "byteOffset": 5308416
1095
+ }
1096
+ ],
1097
+ "md5sum": "1471ebee434c1147a18f440f09f98e91"
1098
+ },
1099
+ {
1100
+ "dataPath": "params_shard_19.bin",
1101
+ "format": "raw-shard",
1102
+ "nbytes": 33239040,
1103
+ "records": [
1104
+ {
1105
+ "name": "param_87",
1106
+ "shape": [
1107
+ 16384,
1108
+ 96
1109
+ ],
1110
+ "dtype": "float16",
1111
+ "format": "raw",
1112
+ "nbytes": 3145728,
1113
+ "byteOffset": 0
1114
+ },
1115
+ {
1116
+ "name": "param_88",
1117
+ "shape": [
1118
+ 3072,
1119
+ 1024
1120
+ ],
1121
+ "dtype": "uint32",
1122
+ "format": "raw",
1123
+ "nbytes": 12582912,
1124
+ "byteOffset": 3145728
1125
+ },
1126
+ {
1127
+ "name": "param_89",
1128
+ "shape": [
1129
+ 3072,
1130
+ 256
1131
+ ],
1132
+ "dtype": "float16",
1133
+ "format": "raw",
1134
+ "nbytes": 1572864,
1135
+ "byteOffset": 15728640
1136
+ },
1137
+ {
1138
+ "name": "param_90",
1139
+ "shape": [
1140
+ 3072
1141
+ ],
1142
+ "dtype": "float16",
1143
+ "format": "raw",
1144
+ "nbytes": 6144,
1145
+ "byteOffset": 17301504
1146
+ },
1147
+ {
1148
+ "name": "param_91",
1149
+ "shape": [
1150
+ 3072
1151
+ ],
1152
+ "dtype": "float16",
1153
+ "format": "raw",
1154
+ "nbytes": 6144,
1155
+ "byteOffset": 17307648
1156
+ },
1157
+ {
1158
+ "name": "param_92",
1159
+ "shape": [
1160
+ 9216,
1161
+ 384
1162
+ ],
1163
+ "dtype": "uint32",
1164
+ "format": "raw",
1165
+ "nbytes": 14155776,
1166
+ "byteOffset": 17313792
1167
+ },
1168
+ {
1169
+ "name": "param_93",
1170
+ "shape": [
1171
+ 9216,
1172
+ 96
1173
+ ],
1174
+ "dtype": "float16",
1175
+ "format": "raw",
1176
+ "nbytes": 1769472,
1177
+ "byteOffset": 31469568
1178
+ }
1179
+ ],
1180
+ "md5sum": "0e32a9c897b51680f461e8b1008f5701"
1181
+ },
1182
+ {
1183
+ "dataPath": "params_shard_20.bin",
1184
+ "format": "raw-shard",
1185
+ "nbytes": 30474240,
1186
+ "records": [
1187
+ {
1188
+ "name": "param_94",
1189
+ "shape": [
1190
+ 3072,
1191
+ 384
1192
+ ],
1193
+ "dtype": "uint32",
1194
+ "format": "raw",
1195
+ "nbytes": 4718592,
1196
+ "byteOffset": 0
1197
+ },
1198
+ {
1199
+ "name": "param_95",
1200
+ "shape": [
1201
+ 3072,
1202
+ 96
1203
+ ],
1204
+ "dtype": "float16",
1205
+ "format": "raw",
1206
+ "nbytes": 589824,
1207
+ "byteOffset": 4718592
1208
+ },
1209
+ {
1210
+ "name": "param_96",
1211
+ "shape": [
1212
+ 16384,
1213
+ 384
1214
+ ],
1215
+ "dtype": "uint32",
1216
+ "format": "raw",
1217
+ "nbytes": 25165824,
1218
+ "byteOffset": 5308416
1219
+ }
1220
+ ],
1221
+ "md5sum": "e26e42c69c260b3bb2ab55694b1482fa"
1222
+ },
1223
+ {
1224
+ "dataPath": "params_shard_21.bin",
1225
+ "format": "raw-shard",
1226
+ "nbytes": 33239040,
1227
+ "records": [
1228
+ {
1229
+ "name": "param_97",
1230
+ "shape": [
1231
+ 16384,
1232
+ 96
1233
+ ],
1234
+ "dtype": "float16",
1235
+ "format": "raw",
1236
+ "nbytes": 3145728,
1237
+ "byteOffset": 0
1238
+ },
1239
+ {
1240
+ "name": "param_98",
1241
+ "shape": [
1242
+ 3072,
1243
+ 1024
1244
+ ],
1245
+ "dtype": "uint32",
1246
+ "format": "raw",
1247
+ "nbytes": 12582912,
1248
+ "byteOffset": 3145728
1249
+ },
1250
+ {
1251
+ "name": "param_99",
1252
+ "shape": [
1253
+ 3072,
1254
+ 256
1255
+ ],
1256
+ "dtype": "float16",
1257
+ "format": "raw",
1258
+ "nbytes": 1572864,
1259
+ "byteOffset": 15728640
1260
+ },
1261
+ {
1262
+ "name": "param_100",
1263
+ "shape": [
1264
+ 3072
1265
+ ],
1266
+ "dtype": "float16",
1267
+ "format": "raw",
1268
+ "nbytes": 6144,
1269
+ "byteOffset": 17301504
1270
+ },
1271
+ {
1272
+ "name": "param_101",
1273
+ "shape": [
1274
+ 3072
1275
+ ],
1276
+ "dtype": "float16",
1277
+ "format": "raw",
1278
+ "nbytes": 6144,
1279
+ "byteOffset": 17307648
1280
+ },
1281
+ {
1282
+ "name": "param_102",
1283
+ "shape": [
1284
+ 9216,
1285
+ 384
1286
+ ],
1287
+ "dtype": "uint32",
1288
+ "format": "raw",
1289
+ "nbytes": 14155776,
1290
+ "byteOffset": 17313792
1291
+ },
1292
+ {
1293
+ "name": "param_103",
1294
+ "shape": [
1295
+ 9216,
1296
+ 96
1297
+ ],
1298
+ "dtype": "float16",
1299
+ "format": "raw",
1300
+ "nbytes": 1769472,
1301
+ "byteOffset": 31469568
1302
+ }
1303
+ ],
1304
+ "md5sum": "ae647c3f3d6a097e5470cf69248d3a63"
1305
+ },
1306
+ {
1307
+ "dataPath": "params_shard_22.bin",
1308
+ "format": "raw-shard",
1309
+ "nbytes": 30474240,
1310
+ "records": [
1311
+ {
1312
+ "name": "param_104",
1313
+ "shape": [
1314
+ 3072,
1315
+ 384
1316
+ ],
1317
+ "dtype": "uint32",
1318
+ "format": "raw",
1319
+ "nbytes": 4718592,
1320
+ "byteOffset": 0
1321
+ },
1322
+ {
1323
+ "name": "param_105",
1324
+ "shape": [
1325
+ 3072,
1326
+ 96
1327
+ ],
1328
+ "dtype": "float16",
1329
+ "format": "raw",
1330
+ "nbytes": 589824,
1331
+ "byteOffset": 4718592
1332
+ },
1333
+ {
1334
+ "name": "param_106",
1335
+ "shape": [
1336
+ 16384,
1337
+ 384
1338
+ ],
1339
+ "dtype": "uint32",
1340
+ "format": "raw",
1341
+ "nbytes": 25165824,
1342
+ "byteOffset": 5308416
1343
+ }
1344
+ ],
1345
+ "md5sum": "871acb8160143ca04a5347cc79ec7885"
1346
+ },
1347
+ {
1348
+ "dataPath": "params_shard_23.bin",
1349
+ "format": "raw-shard",
1350
+ "nbytes": 33239040,
1351
+ "records": [
1352
+ {
1353
+ "name": "param_107",
1354
+ "shape": [
1355
+ 16384,
1356
+ 96
1357
+ ],
1358
+ "dtype": "float16",
1359
+ "format": "raw",
1360
+ "nbytes": 3145728,
1361
+ "byteOffset": 0
1362
+ },
1363
+ {
1364
+ "name": "param_108",
1365
+ "shape": [
1366
+ 3072,
1367
+ 1024
1368
+ ],
1369
+ "dtype": "uint32",
1370
+ "format": "raw",
1371
+ "nbytes": 12582912,
1372
+ "byteOffset": 3145728
1373
+ },
1374
+ {
1375
+ "name": "param_109",
1376
+ "shape": [
1377
+ 3072,
1378
+ 256
1379
+ ],
1380
+ "dtype": "float16",
1381
+ "format": "raw",
1382
+ "nbytes": 1572864,
1383
+ "byteOffset": 15728640
1384
+ },
1385
+ {
1386
+ "name": "param_110",
1387
+ "shape": [
1388
+ 3072
1389
+ ],
1390
+ "dtype": "float16",
1391
+ "format": "raw",
1392
+ "nbytes": 6144,
1393
+ "byteOffset": 17301504
1394
+ },
1395
+ {
1396
+ "name": "param_111",
1397
+ "shape": [
1398
+ 3072
1399
+ ],
1400
+ "dtype": "float16",
1401
+ "format": "raw",
1402
+ "nbytes": 6144,
1403
+ "byteOffset": 17307648
1404
+ },
1405
+ {
1406
+ "name": "param_112",
1407
+ "shape": [
1408
+ 9216,
1409
+ 384
1410
+ ],
1411
+ "dtype": "uint32",
1412
+ "format": "raw",
1413
+ "nbytes": 14155776,
1414
+ "byteOffset": 17313792
1415
+ },
1416
+ {
1417
+ "name": "param_113",
1418
+ "shape": [
1419
+ 9216,
1420
+ 96
1421
+ ],
1422
+ "dtype": "float16",
1423
+ "format": "raw",
1424
+ "nbytes": 1769472,
1425
+ "byteOffset": 31469568
1426
+ }
1427
+ ],
1428
+ "md5sum": "a98b06905334de6643492605ed0fa08f"
1429
+ },
1430
+ {
1431
+ "dataPath": "params_shard_24.bin",
1432
+ "format": "raw-shard",
1433
+ "nbytes": 30474240,
1434
+ "records": [
1435
+ {
1436
+ "name": "param_114",
1437
+ "shape": [
1438
+ 3072,
1439
+ 384
1440
+ ],
1441
+ "dtype": "uint32",
1442
+ "format": "raw",
1443
+ "nbytes": 4718592,
1444
+ "byteOffset": 0
1445
+ },
1446
+ {
1447
+ "name": "param_115",
1448
+ "shape": [
1449
+ 3072,
1450
+ 96
1451
+ ],
1452
+ "dtype": "float16",
1453
+ "format": "raw",
1454
+ "nbytes": 589824,
1455
+ "byteOffset": 4718592
1456
+ },
1457
+ {
1458
+ "name": "param_116",
1459
+ "shape": [
1460
+ 16384,
1461
+ 384
1462
+ ],
1463
+ "dtype": "uint32",
1464
+ "format": "raw",
1465
+ "nbytes": 25165824,
1466
+ "byteOffset": 5308416
1467
+ }
1468
+ ],
1469
+ "md5sum": "a7627fcb0b8897ad5b778e2bfb633481"
1470
+ },
1471
+ {
1472
+ "dataPath": "params_shard_25.bin",
1473
+ "format": "raw-shard",
1474
+ "nbytes": 33239040,
1475
+ "records": [
1476
+ {
1477
+ "name": "param_117",
1478
+ "shape": [
1479
+ 16384,
1480
+ 96
1481
+ ],
1482
+ "dtype": "float16",
1483
+ "format": "raw",
1484
+ "nbytes": 3145728,
1485
+ "byteOffset": 0
1486
+ },
1487
+ {
1488
+ "name": "param_118",
1489
+ "shape": [
1490
+ 3072,
1491
+ 1024
1492
+ ],
1493
+ "dtype": "uint32",
1494
+ "format": "raw",
1495
+ "nbytes": 12582912,
1496
+ "byteOffset": 3145728
1497
+ },
1498
+ {
1499
+ "name": "param_119",
1500
+ "shape": [
1501
+ 3072,
1502
+ 256
1503
+ ],
1504
+ "dtype": "float16",
1505
+ "format": "raw",
1506
+ "nbytes": 1572864,
1507
+ "byteOffset": 15728640
1508
+ },
1509
+ {
1510
+ "name": "param_120",
1511
+ "shape": [
1512
+ 3072
1513
+ ],
1514
+ "dtype": "float16",
1515
+ "format": "raw",
1516
+ "nbytes": 6144,
1517
+ "byteOffset": 17301504
1518
+ },
1519
+ {
1520
+ "name": "param_121",
1521
+ "shape": [
1522
+ 3072
1523
+ ],
1524
+ "dtype": "float16",
1525
+ "format": "raw",
1526
+ "nbytes": 6144,
1527
+ "byteOffset": 17307648
1528
+ },
1529
+ {
1530
+ "name": "param_122",
1531
+ "shape": [
1532
+ 9216,
1533
+ 384
1534
+ ],
1535
+ "dtype": "uint32",
1536
+ "format": "raw",
1537
+ "nbytes": 14155776,
1538
+ "byteOffset": 17313792
1539
+ },
1540
+ {
1541
+ "name": "param_123",
1542
+ "shape": [
1543
+ 9216,
1544
+ 96
1545
+ ],
1546
+ "dtype": "float16",
1547
+ "format": "raw",
1548
+ "nbytes": 1769472,
1549
+ "byteOffset": 31469568
1550
+ }
1551
+ ],
1552
+ "md5sum": "cc15fd71e7ae435df5d24ac8efc7914b"
1553
+ },
1554
+ {
1555
+ "dataPath": "params_shard_26.bin",
1556
+ "format": "raw-shard",
1557
+ "nbytes": 30474240,
1558
+ "records": [
1559
+ {
1560
+ "name": "param_124",
1561
+ "shape": [
1562
+ 3072,
1563
+ 384
1564
+ ],
1565
+ "dtype": "uint32",
1566
+ "format": "raw",
1567
+ "nbytes": 4718592,
1568
+ "byteOffset": 0
1569
+ },
1570
+ {
1571
+ "name": "param_125",
1572
+ "shape": [
1573
+ 3072,
1574
+ 96
1575
+ ],
1576
+ "dtype": "float16",
1577
+ "format": "raw",
1578
+ "nbytes": 589824,
1579
+ "byteOffset": 4718592
1580
+ },
1581
+ {
1582
+ "name": "param_126",
1583
+ "shape": [
1584
+ 16384,
1585
+ 384
1586
+ ],
1587
+ "dtype": "uint32",
1588
+ "format": "raw",
1589
+ "nbytes": 25165824,
1590
+ "byteOffset": 5308416
1591
+ }
1592
+ ],
1593
+ "md5sum": "871cb0c0da0bd2b0fa86f5bd027f7cd4"
1594
+ },
1595
+ {
1596
+ "dataPath": "params_shard_27.bin",
1597
+ "format": "raw-shard",
1598
+ "nbytes": 33239040,
1599
+ "records": [
1600
+ {
1601
+ "name": "param_127",
1602
+ "shape": [
1603
+ 16384,
1604
+ 96
1605
+ ],
1606
+ "dtype": "float16",
1607
+ "format": "raw",
1608
+ "nbytes": 3145728,
1609
+ "byteOffset": 0
1610
+ },
1611
+ {
1612
+ "name": "param_128",
1613
+ "shape": [
1614
+ 3072,
1615
+ 1024
1616
+ ],
1617
+ "dtype": "uint32",
1618
+ "format": "raw",
1619
+ "nbytes": 12582912,
1620
+ "byteOffset": 3145728
1621
+ },
1622
+ {
1623
+ "name": "param_129",
1624
+ "shape": [
1625
+ 3072,
1626
+ 256
1627
+ ],
1628
+ "dtype": "float16",
1629
+ "format": "raw",
1630
+ "nbytes": 1572864,
1631
+ "byteOffset": 15728640
1632
+ },
1633
+ {
1634
+ "name": "param_130",
1635
+ "shape": [
1636
+ 3072
1637
+ ],
1638
+ "dtype": "float16",
1639
+ "format": "raw",
1640
+ "nbytes": 6144,
1641
+ "byteOffset": 17301504
1642
+ },
1643
+ {
1644
+ "name": "param_131",
1645
+ "shape": [
1646
+ 3072
1647
+ ],
1648
+ "dtype": "float16",
1649
+ "format": "raw",
1650
+ "nbytes": 6144,
1651
+ "byteOffset": 17307648
1652
+ },
1653
+ {
1654
+ "name": "param_132",
1655
+ "shape": [
1656
+ 9216,
1657
+ 384
1658
+ ],
1659
+ "dtype": "uint32",
1660
+ "format": "raw",
1661
+ "nbytes": 14155776,
1662
+ "byteOffset": 17313792
1663
+ },
1664
+ {
1665
+ "name": "param_133",
1666
+ "shape": [
1667
+ 9216,
1668
+ 96
1669
+ ],
1670
+ "dtype": "float16",
1671
+ "format": "raw",
1672
+ "nbytes": 1769472,
1673
+ "byteOffset": 31469568
1674
+ }
1675
+ ],
1676
+ "md5sum": "1372630bf1cc3c793393c4caa9676037"
1677
+ },
1678
+ {
1679
+ "dataPath": "params_shard_28.bin",
1680
+ "format": "raw-shard",
1681
+ "nbytes": 30474240,
1682
+ "records": [
1683
+ {
1684
+ "name": "param_134",
1685
+ "shape": [
1686
+ 3072,
1687
+ 384
1688
+ ],
1689
+ "dtype": "uint32",
1690
+ "format": "raw",
1691
+ "nbytes": 4718592,
1692
+ "byteOffset": 0
1693
+ },
1694
+ {
1695
+ "name": "param_135",
1696
+ "shape": [
1697
+ 3072,
1698
+ 96
1699
+ ],
1700
+ "dtype": "float16",
1701
+ "format": "raw",
1702
+ "nbytes": 589824,
1703
+ "byteOffset": 4718592
1704
+ },
1705
+ {
1706
+ "name": "param_136",
1707
+ "shape": [
1708
+ 16384,
1709
+ 384
1710
+ ],
1711
+ "dtype": "uint32",
1712
+ "format": "raw",
1713
+ "nbytes": 25165824,
1714
+ "byteOffset": 5308416
1715
+ }
1716
+ ],
1717
+ "md5sum": "384bce670c71430046a8c55f604dd2be"
1718
+ },
1719
+ {
1720
+ "dataPath": "params_shard_29.bin",
1721
+ "format": "raw-shard",
1722
+ "nbytes": 33239040,
1723
+ "records": [
1724
+ {
1725
+ "name": "param_137",
1726
+ "shape": [
1727
+ 16384,
1728
+ 96
1729
+ ],
1730
+ "dtype": "float16",
1731
+ "format": "raw",
1732
+ "nbytes": 3145728,
1733
+ "byteOffset": 0
1734
+ },
1735
+ {
1736
+ "name": "param_138",
1737
+ "shape": [
1738
+ 3072,
1739
+ 1024
1740
+ ],
1741
+ "dtype": "uint32",
1742
+ "format": "raw",
1743
+ "nbytes": 12582912,
1744
+ "byteOffset": 3145728
1745
+ },
1746
+ {
1747
+ "name": "param_139",
1748
+ "shape": [
1749
+ 3072,
1750
+ 256
1751
+ ],
1752
+ "dtype": "float16",
1753
+ "format": "raw",
1754
+ "nbytes": 1572864,
1755
+ "byteOffset": 15728640
1756
+ },
1757
+ {
1758
+ "name": "param_140",
1759
+ "shape": [
1760
+ 3072
1761
+ ],
1762
+ "dtype": "float16",
1763
+ "format": "raw",
1764
+ "nbytes": 6144,
1765
+ "byteOffset": 17301504
1766
+ },
1767
+ {
1768
+ "name": "param_141",
1769
+ "shape": [
1770
+ 3072
1771
+ ],
1772
+ "dtype": "float16",
1773
+ "format": "raw",
1774
+ "nbytes": 6144,
1775
+ "byteOffset": 17307648
1776
+ },
1777
+ {
1778
+ "name": "param_142",
1779
+ "shape": [
1780
+ 9216,
1781
+ 384
1782
+ ],
1783
+ "dtype": "uint32",
1784
+ "format": "raw",
1785
+ "nbytes": 14155776,
1786
+ "byteOffset": 17313792
1787
+ },
1788
+ {
1789
+ "name": "param_143",
1790
+ "shape": [
1791
+ 9216,
1792
+ 96
1793
+ ],
1794
+ "dtype": "float16",
1795
+ "format": "raw",
1796
+ "nbytes": 1769472,
1797
+ "byteOffset": 31469568
1798
+ }
1799
+ ],
1800
+ "md5sum": "c88b13da2066d10551cebd5ab92a2ce0"
1801
+ },
1802
+ {
1803
+ "dataPath": "params_shard_30.bin",
1804
+ "format": "raw-shard",
1805
+ "nbytes": 30474240,
1806
+ "records": [
1807
+ {
1808
+ "name": "param_144",
1809
+ "shape": [
1810
+ 3072,
1811
+ 384
1812
+ ],
1813
+ "dtype": "uint32",
1814
+ "format": "raw",
1815
+ "nbytes": 4718592,
1816
+ "byteOffset": 0
1817
+ },
1818
+ {
1819
+ "name": "param_145",
1820
+ "shape": [
1821
+ 3072,
1822
+ 96
1823
+ ],
1824
+ "dtype": "float16",
1825
+ "format": "raw",
1826
+ "nbytes": 589824,
1827
+ "byteOffset": 4718592
1828
+ },
1829
+ {
1830
+ "name": "param_146",
1831
+ "shape": [
1832
+ 16384,
1833
+ 384
1834
+ ],
1835
+ "dtype": "uint32",
1836
+ "format": "raw",
1837
+ "nbytes": 25165824,
1838
+ "byteOffset": 5308416
1839
+ }
1840
+ ],
1841
+ "md5sum": "810e6f3b5ab150f4900dd1022ab0a40f"
1842
+ },
1843
+ {
1844
+ "dataPath": "params_shard_31.bin",
1845
+ "format": "raw-shard",
1846
+ "nbytes": 33239040,
1847
+ "records": [
1848
+ {
1849
+ "name": "param_147",
1850
+ "shape": [
1851
+ 16384,
1852
+ 96
1853
+ ],
1854
+ "dtype": "float16",
1855
+ "format": "raw",
1856
+ "nbytes": 3145728,
1857
+ "byteOffset": 0
1858
+ },
1859
+ {
1860
+ "name": "param_148",
1861
+ "shape": [
1862
+ 3072,
1863
+ 1024
1864
+ ],
1865
+ "dtype": "uint32",
1866
+ "format": "raw",
1867
+ "nbytes": 12582912,
1868
+ "byteOffset": 3145728
1869
+ },
1870
+ {
1871
+ "name": "param_149",
1872
+ "shape": [
1873
+ 3072,
1874
+ 256
1875
+ ],
1876
+ "dtype": "float16",
1877
+ "format": "raw",
1878
+ "nbytes": 1572864,
1879
+ "byteOffset": 15728640
1880
+ },
1881
+ {
1882
+ "name": "param_150",
1883
+ "shape": [
1884
+ 3072
1885
+ ],
1886
+ "dtype": "float16",
1887
+ "format": "raw",
1888
+ "nbytes": 6144,
1889
+ "byteOffset": 17301504
1890
+ },
1891
+ {
1892
+ "name": "param_151",
1893
+ "shape": [
1894
+ 3072
1895
+ ],
1896
+ "dtype": "float16",
1897
+ "format": "raw",
1898
+ "nbytes": 6144,
1899
+ "byteOffset": 17307648
1900
+ },
1901
+ {
1902
+ "name": "param_152",
1903
+ "shape": [
1904
+ 9216,
1905
+ 384
1906
+ ],
1907
+ "dtype": "uint32",
1908
+ "format": "raw",
1909
+ "nbytes": 14155776,
1910
+ "byteOffset": 17313792
1911
+ },
1912
+ {
1913
+ "name": "param_153",
1914
+ "shape": [
1915
+ 9216,
1916
+ 96
1917
+ ],
1918
+ "dtype": "float16",
1919
+ "format": "raw",
1920
+ "nbytes": 1769472,
1921
+ "byteOffset": 31469568
1922
+ }
1923
+ ],
1924
+ "md5sum": "7831b6ba62b41e173d6a10fa2505a728"
1925
+ },
1926
+ {
1927
+ "dataPath": "params_shard_32.bin",
1928
+ "format": "raw-shard",
1929
+ "nbytes": 30474240,
1930
+ "records": [
1931
+ {
1932
+ "name": "param_154",
1933
+ "shape": [
1934
+ 3072,
1935
+ 384
1936
+ ],
1937
+ "dtype": "uint32",
1938
+ "format": "raw",
1939
+ "nbytes": 4718592,
1940
+ "byteOffset": 0
1941
+ },
1942
+ {
1943
+ "name": "param_155",
1944
+ "shape": [
1945
+ 3072,
1946
+ 96
1947
+ ],
1948
+ "dtype": "float16",
1949
+ "format": "raw",
1950
+ "nbytes": 589824,
1951
+ "byteOffset": 4718592
1952
+ },
1953
+ {
1954
+ "name": "param_156",
1955
+ "shape": [
1956
+ 16384,
1957
+ 384
1958
+ ],
1959
+ "dtype": "uint32",
1960
+ "format": "raw",
1961
+ "nbytes": 25165824,
1962
+ "byteOffset": 5308416
1963
+ }
1964
+ ],
1965
+ "md5sum": "46f5b5049ec0bd2f0244115053cb08f1"
1966
+ },
1967
+ {
1968
+ "dataPath": "params_shard_33.bin",
1969
+ "format": "raw-shard",
1970
+ "nbytes": 33239040,
1971
+ "records": [
1972
+ {
1973
+ "name": "param_157",
1974
+ "shape": [
1975
+ 16384,
1976
+ 96
1977
+ ],
1978
+ "dtype": "float16",
1979
+ "format": "raw",
1980
+ "nbytes": 3145728,
1981
+ "byteOffset": 0
1982
+ },
1983
+ {
1984
+ "name": "param_158",
1985
+ "shape": [
1986
+ 3072,
1987
+ 1024
1988
+ ],
1989
+ "dtype": "uint32",
1990
+ "format": "raw",
1991
+ "nbytes": 12582912,
1992
+ "byteOffset": 3145728
1993
+ },
1994
+ {
1995
+ "name": "param_159",
1996
+ "shape": [
1997
+ 3072,
1998
+ 256
1999
+ ],
2000
+ "dtype": "float16",
2001
+ "format": "raw",
2002
+ "nbytes": 1572864,
2003
+ "byteOffset": 15728640
2004
+ },
2005
+ {
2006
+ "name": "param_160",
2007
+ "shape": [
2008
+ 3072
2009
+ ],
2010
+ "dtype": "float16",
2011
+ "format": "raw",
2012
+ "nbytes": 6144,
2013
+ "byteOffset": 17301504
2014
+ },
2015
+ {
2016
+ "name": "param_161",
2017
+ "shape": [
2018
+ 3072
2019
+ ],
2020
+ "dtype": "float16",
2021
+ "format": "raw",
2022
+ "nbytes": 6144,
2023
+ "byteOffset": 17307648
2024
+ },
2025
+ {
2026
+ "name": "param_162",
2027
+ "shape": [
2028
+ 9216,
2029
+ 384
2030
+ ],
2031
+ "dtype": "uint32",
2032
+ "format": "raw",
2033
+ "nbytes": 14155776,
2034
+ "byteOffset": 17313792
2035
+ },
2036
+ {
2037
+ "name": "param_163",
2038
+ "shape": [
2039
+ 9216,
2040
+ 96
2041
+ ],
2042
+ "dtype": "float16",
2043
+ "format": "raw",
2044
+ "nbytes": 1769472,
2045
+ "byteOffset": 31469568
2046
+ }
2047
+ ],
2048
+ "md5sum": "d35e67cff788996fcbb377a37c2988e1"
2049
+ },
2050
+ {
2051
+ "dataPath": "params_shard_34.bin",
2052
+ "format": "raw-shard",
2053
+ "nbytes": 30474240,
2054
+ "records": [
2055
+ {
2056
+ "name": "param_164",
2057
+ "shape": [
2058
+ 3072,
2059
+ 384
2060
+ ],
2061
+ "dtype": "uint32",
2062
+ "format": "raw",
2063
+ "nbytes": 4718592,
2064
+ "byteOffset": 0
2065
+ },
2066
+ {
2067
+ "name": "param_165",
2068
+ "shape": [
2069
+ 3072,
2070
+ 96
2071
+ ],
2072
+ "dtype": "float16",
2073
+ "format": "raw",
2074
+ "nbytes": 589824,
2075
+ "byteOffset": 4718592
2076
+ },
2077
+ {
2078
+ "name": "param_166",
2079
+ "shape": [
2080
+ 16384,
2081
+ 384
2082
+ ],
2083
+ "dtype": "uint32",
2084
+ "format": "raw",
2085
+ "nbytes": 25165824,
2086
+ "byteOffset": 5308416
2087
+ }
2088
+ ],
2089
+ "md5sum": "b773d61b73cbac065381e20361f4367d"
2090
+ },
2091
+ {
2092
+ "dataPath": "params_shard_35.bin",
2093
+ "format": "raw-shard",
2094
+ "nbytes": 33239040,
2095
+ "records": [
2096
+ {
2097
+ "name": "param_167",
2098
+ "shape": [
2099
+ 16384,
2100
+ 96
2101
+ ],
2102
+ "dtype": "float16",
2103
+ "format": "raw",
2104
+ "nbytes": 3145728,
2105
+ "byteOffset": 0
2106
+ },
2107
+ {
2108
+ "name": "param_168",
2109
+ "shape": [
2110
+ 3072,
2111
+ 1024
2112
+ ],
2113
+ "dtype": "uint32",
2114
+ "format": "raw",
2115
+ "nbytes": 12582912,
2116
+ "byteOffset": 3145728
2117
+ },
2118
+ {
2119
+ "name": "param_169",
2120
+ "shape": [
2121
+ 3072,
2122
+ 256
2123
+ ],
2124
+ "dtype": "float16",
2125
+ "format": "raw",
2126
+ "nbytes": 1572864,
2127
+ "byteOffset": 15728640
2128
+ },
2129
+ {
2130
+ "name": "param_170",
2131
+ "shape": [
2132
+ 3072
2133
+ ],
2134
+ "dtype": "float16",
2135
+ "format": "raw",
2136
+ "nbytes": 6144,
2137
+ "byteOffset": 17301504
2138
+ },
2139
+ {
2140
+ "name": "param_171",
2141
+ "shape": [
2142
+ 3072
2143
+ ],
2144
+ "dtype": "float16",
2145
+ "format": "raw",
2146
+ "nbytes": 6144,
2147
+ "byteOffset": 17307648
2148
+ },
2149
+ {
2150
+ "name": "param_172",
2151
+ "shape": [
2152
+ 9216,
2153
+ 384
2154
+ ],
2155
+ "dtype": "uint32",
2156
+ "format": "raw",
2157
+ "nbytes": 14155776,
2158
+ "byteOffset": 17313792
2159
+ },
2160
+ {
2161
+ "name": "param_173",
2162
+ "shape": [
2163
+ 9216,
2164
+ 96
2165
+ ],
2166
+ "dtype": "float16",
2167
+ "format": "raw",
2168
+ "nbytes": 1769472,
2169
+ "byteOffset": 31469568
2170
+ }
2171
+ ],
2172
+ "md5sum": "26e5ed8698a8e8652345ff38879bd502"
2173
+ },
2174
+ {
2175
+ "dataPath": "params_shard_36.bin",
2176
+ "format": "raw-shard",
2177
+ "nbytes": 30474240,
2178
+ "records": [
2179
+ {
2180
+ "name": "param_174",
2181
+ "shape": [
2182
+ 3072,
2183
+ 384
2184
+ ],
2185
+ "dtype": "uint32",
2186
+ "format": "raw",
2187
+ "nbytes": 4718592,
2188
+ "byteOffset": 0
2189
+ },
2190
+ {
2191
+ "name": "param_175",
2192
+ "shape": [
2193
+ 3072,
2194
+ 96
2195
+ ],
2196
+ "dtype": "float16",
2197
+ "format": "raw",
2198
+ "nbytes": 589824,
2199
+ "byteOffset": 4718592
2200
+ },
2201
+ {
2202
+ "name": "param_176",
2203
+ "shape": [
2204
+ 16384,
2205
+ 384
2206
+ ],
2207
+ "dtype": "uint32",
2208
+ "format": "raw",
2209
+ "nbytes": 25165824,
2210
+ "byteOffset": 5308416
2211
+ }
2212
+ ],
2213
+ "md5sum": "7c8d29c2e7398736627702453541c286"
2214
+ },
2215
+ {
2216
+ "dataPath": "params_shard_37.bin",
2217
+ "format": "raw-shard",
2218
+ "nbytes": 33239040,
2219
+ "records": [
2220
+ {
2221
+ "name": "param_177",
2222
+ "shape": [
2223
+ 16384,
2224
+ 96
2225
+ ],
2226
+ "dtype": "float16",
2227
+ "format": "raw",
2228
+ "nbytes": 3145728,
2229
+ "byteOffset": 0
2230
+ },
2231
+ {
2232
+ "name": "param_178",
2233
+ "shape": [
2234
+ 3072,
2235
+ 1024
2236
+ ],
2237
+ "dtype": "uint32",
2238
+ "format": "raw",
2239
+ "nbytes": 12582912,
2240
+ "byteOffset": 3145728
2241
+ },
2242
+ {
2243
+ "name": "param_179",
2244
+ "shape": [
2245
+ 3072,
2246
+ 256
2247
+ ],
2248
+ "dtype": "float16",
2249
+ "format": "raw",
2250
+ "nbytes": 1572864,
2251
+ "byteOffset": 15728640
2252
+ },
2253
+ {
2254
+ "name": "param_180",
2255
+ "shape": [
2256
+ 3072
2257
+ ],
2258
+ "dtype": "float16",
2259
+ "format": "raw",
2260
+ "nbytes": 6144,
2261
+ "byteOffset": 17301504
2262
+ },
2263
+ {
2264
+ "name": "param_181",
2265
+ "shape": [
2266
+ 3072
2267
+ ],
2268
+ "dtype": "float16",
2269
+ "format": "raw",
2270
+ "nbytes": 6144,
2271
+ "byteOffset": 17307648
2272
+ },
2273
+ {
2274
+ "name": "param_182",
2275
+ "shape": [
2276
+ 9216,
2277
+ 384
2278
+ ],
2279
+ "dtype": "uint32",
2280
+ "format": "raw",
2281
+ "nbytes": 14155776,
2282
+ "byteOffset": 17313792
2283
+ },
2284
+ {
2285
+ "name": "param_183",
2286
+ "shape": [
2287
+ 9216,
2288
+ 96
2289
+ ],
2290
+ "dtype": "float16",
2291
+ "format": "raw",
2292
+ "nbytes": 1769472,
2293
+ "byteOffset": 31469568
2294
+ }
2295
+ ],
2296
+ "md5sum": "662ba7267d5620fd903802819eeb9788"
2297
+ },
2298
+ {
2299
+ "dataPath": "params_shard_38.bin",
2300
+ "format": "raw-shard",
2301
+ "nbytes": 30474240,
2302
+ "records": [
2303
+ {
2304
+ "name": "param_184",
2305
+ "shape": [
2306
+ 3072,
2307
+ 384
2308
+ ],
2309
+ "dtype": "uint32",
2310
+ "format": "raw",
2311
+ "nbytes": 4718592,
2312
+ "byteOffset": 0
2313
+ },
2314
+ {
2315
+ "name": "param_185",
2316
+ "shape": [
2317
+ 3072,
2318
+ 96
2319
+ ],
2320
+ "dtype": "float16",
2321
+ "format": "raw",
2322
+ "nbytes": 589824,
2323
+ "byteOffset": 4718592
2324
+ },
2325
+ {
2326
+ "name": "param_186",
2327
+ "shape": [
2328
+ 16384,
2329
+ 384
2330
+ ],
2331
+ "dtype": "uint32",
2332
+ "format": "raw",
2333
+ "nbytes": 25165824,
2334
+ "byteOffset": 5308416
2335
+ }
2336
+ ],
2337
+ "md5sum": "7fca258deddd082906005d8c6b594562"
2338
+ },
2339
+ {
2340
+ "dataPath": "params_shard_39.bin",
2341
+ "format": "raw-shard",
2342
+ "nbytes": 33239040,
2343
+ "records": [
2344
+ {
2345
+ "name": "param_187",
2346
+ "shape": [
2347
+ 16384,
2348
+ 96
2349
+ ],
2350
+ "dtype": "float16",
2351
+ "format": "raw",
2352
+ "nbytes": 3145728,
2353
+ "byteOffset": 0
2354
+ },
2355
+ {
2356
+ "name": "param_188",
2357
+ "shape": [
2358
+ 3072,
2359
+ 1024
2360
+ ],
2361
+ "dtype": "uint32",
2362
+ "format": "raw",
2363
+ "nbytes": 12582912,
2364
+ "byteOffset": 3145728
2365
+ },
2366
+ {
2367
+ "name": "param_189",
2368
+ "shape": [
2369
+ 3072,
2370
+ 256
2371
+ ],
2372
+ "dtype": "float16",
2373
+ "format": "raw",
2374
+ "nbytes": 1572864,
2375
+ "byteOffset": 15728640
2376
+ },
2377
+ {
2378
+ "name": "param_190",
2379
+ "shape": [
2380
+ 3072
2381
+ ],
2382
+ "dtype": "float16",
2383
+ "format": "raw",
2384
+ "nbytes": 6144,
2385
+ "byteOffset": 17301504
2386
+ },
2387
+ {
2388
+ "name": "param_191",
2389
+ "shape": [
2390
+ 3072
2391
+ ],
2392
+ "dtype": "float16",
2393
+ "format": "raw",
2394
+ "nbytes": 6144,
2395
+ "byteOffset": 17307648
2396
+ },
2397
+ {
2398
+ "name": "param_192",
2399
+ "shape": [
2400
+ 9216,
2401
+ 384
2402
+ ],
2403
+ "dtype": "uint32",
2404
+ "format": "raw",
2405
+ "nbytes": 14155776,
2406
+ "byteOffset": 17313792
2407
+ },
2408
+ {
2409
+ "name": "param_193",
2410
+ "shape": [
2411
+ 9216,
2412
+ 96
2413
+ ],
2414
+ "dtype": "float16",
2415
+ "format": "raw",
2416
+ "nbytes": 1769472,
2417
+ "byteOffset": 31469568
2418
+ }
2419
+ ],
2420
+ "md5sum": "5bf417a7fac3087ed714131189075816"
2421
+ },
2422
+ {
2423
+ "dataPath": "params_shard_40.bin",
2424
+ "format": "raw-shard",
2425
+ "nbytes": 30474240,
2426
+ "records": [
2427
+ {
2428
+ "name": "param_194",
2429
+ "shape": [
2430
+ 3072,
2431
+ 384
2432
+ ],
2433
+ "dtype": "uint32",
2434
+ "format": "raw",
2435
+ "nbytes": 4718592,
2436
+ "byteOffset": 0
2437
+ },
2438
+ {
2439
+ "name": "param_195",
2440
+ "shape": [
2441
+ 3072,
2442
+ 96
2443
+ ],
2444
+ "dtype": "float16",
2445
+ "format": "raw",
2446
+ "nbytes": 589824,
2447
+ "byteOffset": 4718592
2448
+ },
2449
+ {
2450
+ "name": "param_196",
2451
+ "shape": [
2452
+ 16384,
2453
+ 384
2454
+ ],
2455
+ "dtype": "uint32",
2456
+ "format": "raw",
2457
+ "nbytes": 25165824,
2458
+ "byteOffset": 5308416
2459
+ }
2460
+ ],
2461
+ "md5sum": "c82817e7f5c165463d841e9a9c842997"
2462
+ },
2463
+ {
2464
+ "dataPath": "params_shard_41.bin",
2465
+ "format": "raw-shard",
2466
+ "nbytes": 33239040,
2467
+ "records": [
2468
+ {
2469
+ "name": "param_197",
2470
+ "shape": [
2471
+ 16384,
2472
+ 96
2473
+ ],
2474
+ "dtype": "float16",
2475
+ "format": "raw",
2476
+ "nbytes": 3145728,
2477
+ "byteOffset": 0
2478
+ },
2479
+ {
2480
+ "name": "param_198",
2481
+ "shape": [
2482
+ 3072,
2483
+ 1024
2484
+ ],
2485
+ "dtype": "uint32",
2486
+ "format": "raw",
2487
+ "nbytes": 12582912,
2488
+ "byteOffset": 3145728
2489
+ },
2490
+ {
2491
+ "name": "param_199",
2492
+ "shape": [
2493
+ 3072,
2494
+ 256
2495
+ ],
2496
+ "dtype": "float16",
2497
+ "format": "raw",
2498
+ "nbytes": 1572864,
2499
+ "byteOffset": 15728640
2500
+ },
2501
+ {
2502
+ "name": "param_200",
2503
+ "shape": [
2504
+ 3072
2505
+ ],
2506
+ "dtype": "float16",
2507
+ "format": "raw",
2508
+ "nbytes": 6144,
2509
+ "byteOffset": 17301504
2510
+ },
2511
+ {
2512
+ "name": "param_201",
2513
+ "shape": [
2514
+ 3072
2515
+ ],
2516
+ "dtype": "float16",
2517
+ "format": "raw",
2518
+ "nbytes": 6144,
2519
+ "byteOffset": 17307648
2520
+ },
2521
+ {
2522
+ "name": "param_202",
2523
+ "shape": [
2524
+ 9216,
2525
+ 384
2526
+ ],
2527
+ "dtype": "uint32",
2528
+ "format": "raw",
2529
+ "nbytes": 14155776,
2530
+ "byteOffset": 17313792
2531
+ },
2532
+ {
2533
+ "name": "param_203",
2534
+ "shape": [
2535
+ 9216,
2536
+ 96
2537
+ ],
2538
+ "dtype": "float16",
2539
+ "format": "raw",
2540
+ "nbytes": 1769472,
2541
+ "byteOffset": 31469568
2542
+ }
2543
+ ],
2544
+ "md5sum": "b05284a92d345b891b61d066f50d565b"
2545
+ },
2546
+ {
2547
+ "dataPath": "params_shard_42.bin",
2548
+ "format": "raw-shard",
2549
+ "nbytes": 30474240,
2550
+ "records": [
2551
+ {
2552
+ "name": "param_204",
2553
+ "shape": [
2554
+ 3072,
2555
+ 384
2556
+ ],
2557
+ "dtype": "uint32",
2558
+ "format": "raw",
2559
+ "nbytes": 4718592,
2560
+ "byteOffset": 0
2561
+ },
2562
+ {
2563
+ "name": "param_205",
2564
+ "shape": [
2565
+ 3072,
2566
+ 96
2567
+ ],
2568
+ "dtype": "float16",
2569
+ "format": "raw",
2570
+ "nbytes": 589824,
2571
+ "byteOffset": 4718592
2572
+ },
2573
+ {
2574
+ "name": "param_206",
2575
+ "shape": [
2576
+ 16384,
2577
+ 384
2578
+ ],
2579
+ "dtype": "uint32",
2580
+ "format": "raw",
2581
+ "nbytes": 25165824,
2582
+ "byteOffset": 5308416
2583
+ }
2584
+ ],
2585
+ "md5sum": "bfd684dbf1519a513ace0f048c2a39be"
2586
+ },
2587
+ {
2588
+ "dataPath": "params_shard_43.bin",
2589
+ "format": "raw-shard",
2590
+ "nbytes": 33239040,
2591
+ "records": [
2592
+ {
2593
+ "name": "param_207",
2594
+ "shape": [
2595
+ 16384,
2596
+ 96
2597
+ ],
2598
+ "dtype": "float16",
2599
+ "format": "raw",
2600
+ "nbytes": 3145728,
2601
+ "byteOffset": 0
2602
+ },
2603
+ {
2604
+ "name": "param_208",
2605
+ "shape": [
2606
+ 3072,
2607
+ 1024
2608
+ ],
2609
+ "dtype": "uint32",
2610
+ "format": "raw",
2611
+ "nbytes": 12582912,
2612
+ "byteOffset": 3145728
2613
+ },
2614
+ {
2615
+ "name": "param_209",
2616
+ "shape": [
2617
+ 3072,
2618
+ 256
2619
+ ],
2620
+ "dtype": "float16",
2621
+ "format": "raw",
2622
+ "nbytes": 1572864,
2623
+ "byteOffset": 15728640
2624
+ },
2625
+ {
2626
+ "name": "param_210",
2627
+ "shape": [
2628
+ 3072
2629
+ ],
2630
+ "dtype": "float16",
2631
+ "format": "raw",
2632
+ "nbytes": 6144,
2633
+ "byteOffset": 17301504
2634
+ },
2635
+ {
2636
+ "name": "param_211",
2637
+ "shape": [
2638
+ 3072
2639
+ ],
2640
+ "dtype": "float16",
2641
+ "format": "raw",
2642
+ "nbytes": 6144,
2643
+ "byteOffset": 17307648
2644
+ },
2645
+ {
2646
+ "name": "param_212",
2647
+ "shape": [
2648
+ 9216,
2649
+ 384
2650
+ ],
2651
+ "dtype": "uint32",
2652
+ "format": "raw",
2653
+ "nbytes": 14155776,
2654
+ "byteOffset": 17313792
2655
+ },
2656
+ {
2657
+ "name": "param_213",
2658
+ "shape": [
2659
+ 9216,
2660
+ 96
2661
+ ],
2662
+ "dtype": "float16",
2663
+ "format": "raw",
2664
+ "nbytes": 1769472,
2665
+ "byteOffset": 31469568
2666
+ }
2667
+ ],
2668
+ "md5sum": "815087a3375fae098120207cf73606b6"
2669
+ },
2670
+ {
2671
+ "dataPath": "params_shard_44.bin",
2672
+ "format": "raw-shard",
2673
+ "nbytes": 30474240,
2674
+ "records": [
2675
+ {
2676
+ "name": "param_214",
2677
+ "shape": [
2678
+ 3072,
2679
+ 384
2680
+ ],
2681
+ "dtype": "uint32",
2682
+ "format": "raw",
2683
+ "nbytes": 4718592,
2684
+ "byteOffset": 0
2685
+ },
2686
+ {
2687
+ "name": "param_215",
2688
+ "shape": [
2689
+ 3072,
2690
+ 96
2691
+ ],
2692
+ "dtype": "float16",
2693
+ "format": "raw",
2694
+ "nbytes": 589824,
2695
+ "byteOffset": 4718592
2696
+ },
2697
+ {
2698
+ "name": "param_216",
2699
+ "shape": [
2700
+ 16384,
2701
+ 384
2702
+ ],
2703
+ "dtype": "uint32",
2704
+ "format": "raw",
2705
+ "nbytes": 25165824,
2706
+ "byteOffset": 5308416
2707
+ }
2708
+ ],
2709
+ "md5sum": "5065ca3fd598a6582c10353f8a48f235"
2710
+ },
2711
+ {
2712
+ "dataPath": "params_shard_45.bin",
2713
+ "format": "raw-shard",
2714
+ "nbytes": 33239040,
2715
+ "records": [
2716
+ {
2717
+ "name": "param_217",
2718
+ "shape": [
2719
+ 16384,
2720
+ 96
2721
+ ],
2722
+ "dtype": "float16",
2723
+ "format": "raw",
2724
+ "nbytes": 3145728,
2725
+ "byteOffset": 0
2726
+ },
2727
+ {
2728
+ "name": "param_218",
2729
+ "shape": [
2730
+ 3072,
2731
+ 1024
2732
+ ],
2733
+ "dtype": "uint32",
2734
+ "format": "raw",
2735
+ "nbytes": 12582912,
2736
+ "byteOffset": 3145728
2737
+ },
2738
+ {
2739
+ "name": "param_219",
2740
+ "shape": [
2741
+ 3072,
2742
+ 256
2743
+ ],
2744
+ "dtype": "float16",
2745
+ "format": "raw",
2746
+ "nbytes": 1572864,
2747
+ "byteOffset": 15728640
2748
+ },
2749
+ {
2750
+ "name": "param_220",
2751
+ "shape": [
2752
+ 3072
2753
+ ],
2754
+ "dtype": "float16",
2755
+ "format": "raw",
2756
+ "nbytes": 6144,
2757
+ "byteOffset": 17301504
2758
+ },
2759
+ {
2760
+ "name": "param_221",
2761
+ "shape": [
2762
+ 3072
2763
+ ],
2764
+ "dtype": "float16",
2765
+ "format": "raw",
2766
+ "nbytes": 6144,
2767
+ "byteOffset": 17307648
2768
+ },
2769
+ {
2770
+ "name": "param_222",
2771
+ "shape": [
2772
+ 9216,
2773
+ 384
2774
+ ],
2775
+ "dtype": "uint32",
2776
+ "format": "raw",
2777
+ "nbytes": 14155776,
2778
+ "byteOffset": 17313792
2779
+ },
2780
+ {
2781
+ "name": "param_223",
2782
+ "shape": [
2783
+ 9216,
2784
+ 96
2785
+ ],
2786
+ "dtype": "float16",
2787
+ "format": "raw",
2788
+ "nbytes": 1769472,
2789
+ "byteOffset": 31469568
2790
+ }
2791
+ ],
2792
+ "md5sum": "bdb40b4e92059de1100895fd5336fb7c"
2793
+ },
2794
+ {
2795
+ "dataPath": "params_shard_46.bin",
2796
+ "format": "raw-shard",
2797
+ "nbytes": 30474240,
2798
+ "records": [
2799
+ {
2800
+ "name": "param_224",
2801
+ "shape": [
2802
+ 3072,
2803
+ 384
2804
+ ],
2805
+ "dtype": "uint32",
2806
+ "format": "raw",
2807
+ "nbytes": 4718592,
2808
+ "byteOffset": 0
2809
+ },
2810
+ {
2811
+ "name": "param_225",
2812
+ "shape": [
2813
+ 3072,
2814
+ 96
2815
+ ],
2816
+ "dtype": "float16",
2817
+ "format": "raw",
2818
+ "nbytes": 589824,
2819
+ "byteOffset": 4718592
2820
+ },
2821
+ {
2822
+ "name": "param_226",
2823
+ "shape": [
2824
+ 16384,
2825
+ 384
2826
+ ],
2827
+ "dtype": "uint32",
2828
+ "format": "raw",
2829
+ "nbytes": 25165824,
2830
+ "byteOffset": 5308416
2831
+ }
2832
+ ],
2833
+ "md5sum": "7a8e6878b7e620871f7b65301ec72550"
2834
+ },
2835
+ {
2836
+ "dataPath": "params_shard_47.bin",
2837
+ "format": "raw-shard",
2838
+ "nbytes": 33239040,
2839
+ "records": [
2840
+ {
2841
+ "name": "param_227",
2842
+ "shape": [
2843
+ 16384,
2844
+ 96
2845
+ ],
2846
+ "dtype": "float16",
2847
+ "format": "raw",
2848
+ "nbytes": 3145728,
2849
+ "byteOffset": 0
2850
+ },
2851
+ {
2852
+ "name": "param_228",
2853
+ "shape": [
2854
+ 3072,
2855
+ 1024
2856
+ ],
2857
+ "dtype": "uint32",
2858
+ "format": "raw",
2859
+ "nbytes": 12582912,
2860
+ "byteOffset": 3145728
2861
+ },
2862
+ {
2863
+ "name": "param_229",
2864
+ "shape": [
2865
+ 3072,
2866
+ 256
2867
+ ],
2868
+ "dtype": "float16",
2869
+ "format": "raw",
2870
+ "nbytes": 1572864,
2871
+ "byteOffset": 15728640
2872
+ },
2873
+ {
2874
+ "name": "param_230",
2875
+ "shape": [
2876
+ 3072
2877
+ ],
2878
+ "dtype": "float16",
2879
+ "format": "raw",
2880
+ "nbytes": 6144,
2881
+ "byteOffset": 17301504
2882
+ },
2883
+ {
2884
+ "name": "param_231",
2885
+ "shape": [
2886
+ 3072
2887
+ ],
2888
+ "dtype": "float16",
2889
+ "format": "raw",
2890
+ "nbytes": 6144,
2891
+ "byteOffset": 17307648
2892
+ },
2893
+ {
2894
+ "name": "param_232",
2895
+ "shape": [
2896
+ 9216,
2897
+ 384
2898
+ ],
2899
+ "dtype": "uint32",
2900
+ "format": "raw",
2901
+ "nbytes": 14155776,
2902
+ "byteOffset": 17313792
2903
+ },
2904
+ {
2905
+ "name": "param_233",
2906
+ "shape": [
2907
+ 9216,
2908
+ 96
2909
+ ],
2910
+ "dtype": "float16",
2911
+ "format": "raw",
2912
+ "nbytes": 1769472,
2913
+ "byteOffset": 31469568
2914
+ }
2915
+ ],
2916
+ "md5sum": "c4867c41c853d1d3c30bc04aa840956b"
2917
+ },
2918
+ {
2919
+ "dataPath": "params_shard_48.bin",
2920
+ "format": "raw-shard",
2921
+ "nbytes": 30474240,
2922
+ "records": [
2923
+ {
2924
+ "name": "param_234",
2925
+ "shape": [
2926
+ 3072,
2927
+ 384
2928
+ ],
2929
+ "dtype": "uint32",
2930
+ "format": "raw",
2931
+ "nbytes": 4718592,
2932
+ "byteOffset": 0
2933
+ },
2934
+ {
2935
+ "name": "param_235",
2936
+ "shape": [
2937
+ 3072,
2938
+ 96
2939
+ ],
2940
+ "dtype": "float16",
2941
+ "format": "raw",
2942
+ "nbytes": 589824,
2943
+ "byteOffset": 4718592
2944
+ },
2945
+ {
2946
+ "name": "param_236",
2947
+ "shape": [
2948
+ 16384,
2949
+ 384
2950
+ ],
2951
+ "dtype": "uint32",
2952
+ "format": "raw",
2953
+ "nbytes": 25165824,
2954
+ "byteOffset": 5308416
2955
+ }
2956
+ ],
2957
+ "md5sum": "a80e5c1d5f2df058f023a47d703174a3"
2958
+ },
2959
+ {
2960
+ "dataPath": "params_shard_49.bin",
2961
+ "format": "raw-shard",
2962
+ "nbytes": 75595776,
2963
+ "records": [
2964
+ {
2965
+ "name": "param_243",
2966
+ "shape": [
2967
+ 49216,
2968
+ 384
2969
+ ],
2970
+ "dtype": "uint32",
2971
+ "format": "raw",
2972
+ "nbytes": 75595776,
2973
+ "byteOffset": 0
2974
+ }
2975
+ ],
2976
+ "md5sum": "3fd26837d3b6d618b756bb755cda1b4e"
2977
+ },
2978
+ {
2979
+ "dataPath": "params_shard_50.bin",
2980
+ "format": "raw-shard",
2981
+ "nbytes": 27817984,
2982
+ "records": [
2983
+ {
2984
+ "name": "param_237",
2985
+ "shape": [
2986
+ 16384,
2987
+ 96
2988
+ ],
2989
+ "dtype": "float16",
2990
+ "format": "raw",
2991
+ "nbytes": 3145728,
2992
+ "byteOffset": 0
2993
+ },
2994
+ {
2995
+ "name": "param_238",
2996
+ "shape": [
2997
+ 3072,
2998
+ 1024
2999
+ ],
3000
+ "dtype": "uint32",
3001
+ "format": "raw",
3002
+ "nbytes": 12582912,
3003
+ "byteOffset": 3145728
3004
+ },
3005
+ {
3006
+ "name": "param_239",
3007
+ "shape": [
3008
+ 3072,
3009
+ 256
3010
+ ],
3011
+ "dtype": "float16",
3012
+ "format": "raw",
3013
+ "nbytes": 1572864,
3014
+ "byteOffset": 15728640
3015
+ },
3016
+ {
3017
+ "name": "param_240",
3018
+ "shape": [
3019
+ 3072
3020
+ ],
3021
+ "dtype": "float16",
3022
+ "format": "raw",
3023
+ "nbytes": 6144,
3024
+ "byteOffset": 17301504
3025
+ },
3026
+ {
3027
+ "name": "param_241",
3028
+ "shape": [
3029
+ 3072
3030
+ ],
3031
+ "dtype": "float16",
3032
+ "format": "raw",
3033
+ "nbytes": 6144,
3034
+ "byteOffset": 17307648
3035
+ },
3036
+ {
3037
+ "name": "param_242",
3038
+ "shape": [
3039
+ 3072
3040
+ ],
3041
+ "dtype": "float16",
3042
+ "format": "raw",
3043
+ "nbytes": 6144,
3044
+ "byteOffset": 17313792
3045
+ },
3046
+ {
3047
+ "name": "param_244",
3048
+ "shape": [
3049
+ 49216,
3050
+ 96
3051
+ ],
3052
+ "dtype": "float16",
3053
+ "format": "raw",
3054
+ "nbytes": 9449472,
3055
+ "byteOffset": 17319936
3056
+ },
3057
+ {
3058
+ "name": "param_245",
3059
+ "shape": [
3060
+ 2048,
3061
+ 128
3062
+ ],
3063
+ "dtype": "float16",
3064
+ "format": "raw",
3065
+ "nbytes": 524288,
3066
+ "byteOffset": 26769408
3067
+ },
3068
+ {
3069
+ "name": "param_246",
3070
+ "shape": [
3071
+ 2048,
3072
+ 128
3073
+ ],
3074
+ "dtype": "float16",
3075
+ "format": "raw",
3076
+ "nbytes": 524288,
3077
+ "byteOffset": 27293696
3078
+ }
3079
+ ],
3080
+ "md5sum": "5703a84f0113a93f65e213357ebc5125"
3081
+ }
3082
+ ]
3083
+ }
params/params_shard_0.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0caf48925d559d45ea56008e06dd0386045c3a87fd99a2ccd68c87d6a1adb16c
3
+ size 75595776
params/params_shard_1.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be4180f1dd651a31ecab054ca84f3d9ac1d8c3a2b4060002decc542e3bdf574c
3
+ size 25165824
params/params_shard_10.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:69a1a4ba16d1487be929512c77d0e9f90ebb0ded887ceb129ff5fed966c01e11
3
+ size 30474240
params/params_shard_11.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1fe474254a011af63ea72f90f651988b9f2b6a2e598338e8f60ce5a71a1616a1
3
+ size 33239040
params/params_shard_12.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e84b43e89595b1c94e8f3a3cb9a8ae8329c08ae7fe7ac4db5a3c54dd82e4a7b
3
+ size 30474240
params/params_shard_13.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:321a5d197c848f83b48845ce899fcac43aa69743646aba5ec0eb193c2a8d6fb2
3
+ size 33239040
params/params_shard_14.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d3bff37f22d9bc445c7240351b326b36715915a2537a0ccc6faea42c697faf83
3
+ size 30474240
params/params_shard_15.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:119d722f35281cc08bcf696906083e75e50fec1f1e37677201f717da065ba9ba
3
+ size 33239040
params/params_shard_16.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:120dd3921fb1102e1fa844e70fe3b60d7718dbb9337ccded4d35d1079f9775e2
3
+ size 30474240
params/params_shard_17.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:64b78180a17c1556ab28df9bb45814101e6a41445c7502a82f7478e9e3690790
3
+ size 33239040
params/params_shard_18.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:356b72f0f831c7d952ac2a049d8ab8067e81069eab0f3682ea68f80032d078dc
3
+ size 30474240
params/params_shard_19.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:297ee9af15309ea77d34ea016124500d631c37a4bb6dd7d2375e775a622a8b40
3
+ size 33239040
params/params_shard_2.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d4ad2a9aedd32044da876115bc60c0f99113562933b05609dda72c045d8aa183
3
+ size 30683136
params/params_shard_20.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f985cdfa0b2f2704d4a6a6f0ac3d39e5acc3eb6bed9e68d9d14e2af24d96a6da
3
+ size 30474240
params/params_shard_21.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a209815fe5bec279be92bc4f1642b922d51e22ba370201f3513ad156523d349
3
+ size 33239040
params/params_shard_22.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7657e75745c898223a1e20a143ba15b10dc6d95b2970c88f807c1b5ec25f3c71
3
+ size 30474240
params/params_shard_23.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:871af80b5fb179617bba17dcfa0a5ebb335b728b6df7f4db7ddc78b32b6ce9c6
3
+ size 33239040
params/params_shard_24.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6a1c9cfbe373441f7d926f48253e56309420cfe6a90a71c4ccf491778646f2b
3
+ size 30474240
params/params_shard_25.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e8ae18626cf9ceb4eeac399bb9ffa3a301b758aac654bc44f011b5de2110e53
3
+ size 33239040
params/params_shard_26.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7fed0f45c57f45303a982edd969bba27cf13e2043175d5923af8bd42e238be12
3
+ size 30474240
params/params_shard_27.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c728d54e6f009d1e61cfd81446ac1c447db26fbb818600430dca819c65e1a800
3
+ size 33239040
params/params_shard_28.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e516688a4fdedaca17b06ead13655c8c52e24cc977e4d2cbd9e58150e570c74
3
+ size 30474240
params/params_shard_29.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae1c968b723e32fb08892c666a28bd5d4a5be1f4478e3a90fb5ff311b40b1afe
3
+ size 33239040
params/params_shard_3.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:798f70307ff7f264cb772d377bbd96d3ce0b0380a667eada383e9e8f92670886
3
+ size 33239040
params/params_shard_30.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5fa3fa67d55ed83f32fa183cebd5026014b178db4b94a8968feee47aa6157922
3
+ size 30474240
params/params_shard_31.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7a29072b0947d2b1451c5649b9f67d5fbdac9d55a098d7682b02af3263179d00
3
+ size 33239040
params/params_shard_32.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7d764a0fdb9faeb153c1cf25a0e795a87963adf28f2c5ce30b2df5f3a49df8d2
3
+ size 30474240
params/params_shard_33.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a06ab40892dde63b328e1d7190bb933fb21cd4392f22f061dc83dfb83154ad3a
3
+ size 33239040
params/params_shard_34.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:28368c97d8dae349e2ccfdbdbdcfc0bdc4241d1332358f4a7790e9e438254e85
3
+ size 30474240
params/params_shard_35.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9816d110a71deed28c3aa457d4cc99a90ba77194d413cc089e7a80a3706f3cd3
3
+ size 33239040
params/params_shard_36.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8da18acfd2d709bb774e291169d9e6bb56ba5acb7698dac5985284ddbd46940
3
+ size 30474240
params/params_shard_37.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:30363bdb013d0d9ab1b65172221319421ceecc9851300b516a8d3edb63876fcd
3
+ size 33239040
params/params_shard_38.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cec2b7d9777cab28f22c81abfdb96e0d9a9909c5ca31aa9b1d313c150eb49409
3
+ size 30474240
params/params_shard_39.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5af4dbb6b91907a8a50a341fae042f3245b3060ba3021ed9e776e271167c3711
3
+ size 33239040
params/params_shard_4.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b64c1fee332205732a44ee123da07ec451c2c2cd630ca7d89bb3c2dda91ae17
3
+ size 30474240
params/params_shard_40.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df98b68ba04cf44d7dbd6a93eb7e75ed8925d38b3f62ec1be1090a1ba29d28c4
3
+ size 30474240
params/params_shard_41.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b18550de5b27e6f126bdc691e9c52ad6cd7c893e77942cace19d3aeef5f36537
3
+ size 33239040
params/params_shard_42.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5069df66406c3e1eb38aec32b59c0c4c14c078690b925fe7a60eedd8a7802c20
3
+ size 30474240
params/params_shard_43.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8022e0f117e0ffe2a57ca3cd5d87357dce8c2bee15edc764ee93e0021bb912fc
3
+ size 33239040
params/params_shard_44.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4681fbd23b376b455b97b6c07fd6f21938be64b31c15590802613ed230a060a8
3
+ size 30474240
params/params_shard_45.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d205b22e462a0c5fcb99b9d4e7a1b550b4b7d3414ec46f3620ad65b9e25ceab7
3
+ size 33239040
params/params_shard_46.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:76393b282df931dc149a5ba719da464ee1e1ef4122043e10b994591270bbd153
3
+ size 30474240
params/params_shard_47.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b23f3e7bac75d7f235434659e76f81afd3737d6709797fa1718928c6ee23cd8
3
+ size 33239040
params/params_shard_48.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d03a2d01dccc152fcecb06f8c92111828caac38993cd0723072f5ca6633a310
3
+ size 30474240