Upload README.md with huggingface_hub
Browse files
README.md
CHANGED
@@ -74,7 +74,7 @@ eval_table_size:
|
|
74 |
saves_per_epoch: 4
|
75 |
save_total_limit: 8
|
76 |
debug:
|
77 |
-
deepspeed:
|
78 |
weight_decay: 0.0
|
79 |
fsdp:
|
80 |
fsdp_config:
|
@@ -90,7 +90,7 @@ tokens:
|
|
90 |
|
91 |
</details><br>
|
92 |
|
93 |
-
#
|
94 |
|
95 |
This model was trained from scratch on the None dataset.
|
96 |
|
|
|
74 |
saves_per_epoch: 4
|
75 |
save_total_limit: 8
|
76 |
debug:
|
77 |
+
deepspeed: deepspeed/zero2.json
|
78 |
weight_decay: 0.0
|
79 |
fsdp:
|
80 |
fsdp_config:
|
|
|
90 |
|
91 |
</details><br>
|
92 |
|
93 |
+
# llama-8B-fft
|
94 |
|
95 |
This model was trained from scratch on the None dataset.
|
96 |
|