Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4976698672
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:214b1fa78ca8fc15df64fbfa2a719b3cf5e174531e74c3c61e08d4f480aa4e57
|
3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999802720
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d632634bd583b085bc7ead7165257c3975b6129df5d046a6de02f3517b0cd8ae
|
3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4915916176
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:767d5169a502b333e41fef10e91d335a077843e5d763d5edf0f62d19b6910535
|
3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1168138808
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0ce8b17b9b8820c16b4e174f1f2d56c3bdb9cef3af473fbc61f0fd2fc24c387a
|
3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
@@ -3,3 +3,8 @@
|
|
3 |
{"current_steps": 30, "total_steps": 117, "loss": 1.0175, "lr": 5e-06, "epoch": 0.7692307692307693, "percentage": 25.64, "elapsed_time": "0:15:54", "remaining_time": "0:46:08"}
|
4 |
{"current_steps": 39, "total_steps": 117, "eval_loss": 0.9853456020355225, "epoch": 1.0, "percentage": 33.33, "elapsed_time": "0:21:05", "remaining_time": "0:42:10"}
|
5 |
{"current_steps": 40, "total_steps": 117, "loss": 0.987, "lr": 5e-06, "epoch": 1.0256410256410255, "percentage": 34.19, "elapsed_time": "0:22:45", "remaining_time": "0:43:48"}
|
|
|
|
|
|
|
|
|
|
|
|
3 |
{"current_steps": 30, "total_steps": 117, "loss": 1.0175, "lr": 5e-06, "epoch": 0.7692307692307693, "percentage": 25.64, "elapsed_time": "0:15:54", "remaining_time": "0:46:08"}
|
4 |
{"current_steps": 39, "total_steps": 117, "eval_loss": 0.9853456020355225, "epoch": 1.0, "percentage": 33.33, "elapsed_time": "0:21:05", "remaining_time": "0:42:10"}
|
5 |
{"current_steps": 40, "total_steps": 117, "loss": 0.987, "lr": 5e-06, "epoch": 1.0256410256410255, "percentage": 34.19, "elapsed_time": "0:22:45", "remaining_time": "0:43:48"}
|
6 |
+
{"current_steps": 50, "total_steps": 117, "loss": 0.939, "lr": 5e-06, "epoch": 1.282051282051282, "percentage": 42.74, "elapsed_time": "0:28:01", "remaining_time": "0:37:33"}
|
7 |
+
{"current_steps": 60, "total_steps": 117, "loss": 0.9251, "lr": 5e-06, "epoch": 1.5384615384615383, "percentage": 51.28, "elapsed_time": "0:33:17", "remaining_time": "0:31:38"}
|
8 |
+
{"current_steps": 70, "total_steps": 117, "loss": 0.9218, "lr": 5e-06, "epoch": 1.7948717948717947, "percentage": 59.83, "elapsed_time": "0:38:33", "remaining_time": "0:25:53"}
|
9 |
+
{"current_steps": 78, "total_steps": 117, "eval_loss": 0.9502609372138977, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "0:43:11", "remaining_time": "0:21:35"}
|
10 |
+
{"current_steps": 80, "total_steps": 117, "loss": 0.905, "lr": 5e-06, "epoch": 2.051282051282051, "percentage": 68.38, "elapsed_time": "0:45:31", "remaining_time": "0:21:03"}
|