Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4976698672
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:04729f52398e656bc4153539d9600ca134619822d7e0fa49211dec97ef65c983
|
3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999802720
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2f3998d59373d9eda192f9146f0dd3f69baa9fb01d48913642987dcfaac882c4
|
3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4915916176
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:77aca4d0fe7ad5f09b90437841cfe450969e7c83ed2483e5ffb37857bbb8e23d
|
3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1168138808
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:60604f00a5ef0646b955e367bb0d61e62d157e27d1256a9d9b1d66e128dfbca1
|
3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
@@ -6,3 +6,8 @@
|
|
6 |
{"current_steps": 50, "total_steps": 90, "loss": 0.8022, "lr": 5e-06, "epoch": 1.639676113360324, "percentage": 55.56, "elapsed_time": "0:49:30", "remaining_time": "0:39:36"}
|
7 |
{"current_steps": 60, "total_steps": 90, "loss": 0.7929, "lr": 5e-06, "epoch": 1.9635627530364372, "percentage": 66.67, "elapsed_time": "0:59:03", "remaining_time": "0:29:31"}
|
8 |
{"current_steps": 60, "total_steps": 90, "eval_loss": 0.8138453960418701, "epoch": 1.9635627530364372, "percentage": 66.67, "elapsed_time": "1:00:02", "remaining_time": "0:30:01"}
|
|
|
|
|
|
|
|
|
|
|
|
6 |
{"current_steps": 50, "total_steps": 90, "loss": 0.8022, "lr": 5e-06, "epoch": 1.639676113360324, "percentage": 55.56, "elapsed_time": "0:49:30", "remaining_time": "0:39:36"}
|
7 |
{"current_steps": 60, "total_steps": 90, "loss": 0.7929, "lr": 5e-06, "epoch": 1.9635627530364372, "percentage": 66.67, "elapsed_time": "0:59:03", "remaining_time": "0:29:31"}
|
8 |
{"current_steps": 60, "total_steps": 90, "eval_loss": 0.8138453960418701, "epoch": 1.9635627530364372, "percentage": 66.67, "elapsed_time": "1:00:02", "remaining_time": "0:30:01"}
|
9 |
+
{"current_steps": 70, "total_steps": 90, "loss": 0.8051, "lr": 5e-06, "epoch": 2.3076923076923075, "percentage": 77.78, "elapsed_time": "1:10:21", "remaining_time": "0:20:06"}
|
10 |
+
{"current_steps": 80, "total_steps": 90, "loss": 0.7367, "lr": 5e-06, "epoch": 2.6315789473684212, "percentage": 88.89, "elapsed_time": "1:19:54", "remaining_time": "0:09:59"}
|
11 |
+
{"current_steps": 90, "total_steps": 90, "loss": 0.728, "lr": 5e-06, "epoch": 2.9554655870445345, "percentage": 100.0, "elapsed_time": "1:29:25", "remaining_time": "0:00:00"}
|
12 |
+
{"current_steps": 90, "total_steps": 90, "eval_loss": 0.8001113533973694, "epoch": 2.9554655870445345, "percentage": 100.0, "elapsed_time": "1:31:10", "remaining_time": "0:00:00"}
|
13 |
+
{"current_steps": 90, "total_steps": 90, "epoch": 2.9554655870445345, "percentage": 100.0, "elapsed_time": "1:32:24", "remaining_time": "0:00:00"}
|