Training in progress, epoch 1
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4976698672
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:df1188a1f66cc7ecdaeb75880bf3e1ccb3a4328a5a3c0539ff6b4ef1a218ccf8
|
3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999802720
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:946bfb7458bb2ba40f9d9befac496a9f1350e210181df1708ab4138bb6332e3b
|
3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4915916176
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2123827a0fea800eda0959c91db82e668e2d5b46b2ddf59991bf9c3527e2390b
|
3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1168138808
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8f6fa50a108df059b233586abd1edbb9b659148ef83b6e25da1c23d61e83bd34
|
3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
@@ -1,3 +1,7 @@
|
|
1 |
{"current_steps": 10, "total_steps": 81, "loss": 1.224, "lr": 5e-06, "epoch": 0.3595505617977528, "percentage": 12.35, "elapsed_time": "0:23:24", "remaining_time": "2:46:10"}
|
2 |
{"current_steps": 20, "total_steps": 81, "loss": 1.1104, "lr": 5e-06, "epoch": 0.7191011235955056, "percentage": 24.69, "elapsed_time": "0:46:42", "remaining_time": "2:22:27"}
|
3 |
{"current_steps": 27, "total_steps": 81, "eval_loss": 1.065308928489685, "epoch": 0.9707865168539326, "percentage": 33.33, "elapsed_time": "1:06:07", "remaining_time": "2:12:14"}
|
|
|
|
|
|
|
|
|
|
1 |
{"current_steps": 10, "total_steps": 81, "loss": 1.224, "lr": 5e-06, "epoch": 0.3595505617977528, "percentage": 12.35, "elapsed_time": "0:23:24", "remaining_time": "2:46:10"}
|
2 |
{"current_steps": 20, "total_steps": 81, "loss": 1.1104, "lr": 5e-06, "epoch": 0.7191011235955056, "percentage": 24.69, "elapsed_time": "0:46:42", "remaining_time": "2:22:27"}
|
3 |
{"current_steps": 27, "total_steps": 81, "eval_loss": 1.065308928489685, "epoch": 0.9707865168539326, "percentage": 33.33, "elapsed_time": "1:06:07", "remaining_time": "2:12:14"}
|
4 |
+
{"current_steps": 30, "total_steps": 81, "loss": 1.0655, "lr": 5e-06, "epoch": 1.0786516853932584, "percentage": 37.04, "elapsed_time": "1:12:35", "remaining_time": "2:03:24"}
|
5 |
+
{"current_steps": 40, "total_steps": 81, "loss": 1.0192, "lr": 5e-06, "epoch": 1.4382022471910112, "percentage": 49.38, "elapsed_time": "1:35:52", "remaining_time": "1:38:16"}
|
6 |
+
{"current_steps": 50, "total_steps": 81, "loss": 1.0003, "lr": 5e-06, "epoch": 1.797752808988764, "percentage": 61.73, "elapsed_time": "1:59:10", "remaining_time": "1:13:53"}
|
7 |
+
{"current_steps": 55, "total_steps": 81, "eval_loss": 1.020365595817566, "epoch": 1.9775280898876404, "percentage": 67.9, "elapsed_time": "2:13:28", "remaining_time": "1:03:06"}
|