Training in progress, epoch 1
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4976698672
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:84cc546ea88454b30ea0b32cd0f00f215939150cc60dfb2d75cf3febf9e88366
|
3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999802720
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e8ab5d0e4a635af5a4c445297a1b8d3f18d50e635fbee057ae5847e707f28ac4
|
3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4915916176
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c1009fab4e5c6f7bea720958b4ad4874b8e34cd8859ba166f9bc30cdb6249fcc
|
3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1168138808
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b4cd0aaf8d5c7ecf6c1ff628cd6c6e9ec4a149a10bbb141822056f17c629e0a4
|
3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
@@ -2,3 +2,7 @@
|
|
2 |
{"current_steps": 20, "total_steps": 93, "loss": 0.4778, "lr": 5e-06, "epoch": 0.6299212598425197, "percentage": 21.51, "elapsed_time": "0:19:16", "remaining_time": "1:10:20"}
|
3 |
{"current_steps": 30, "total_steps": 93, "loss": 0.4472, "lr": 5e-06, "epoch": 0.9448818897637795, "percentage": 32.26, "elapsed_time": "0:28:53", "remaining_time": "1:00:39"}
|
4 |
{"current_steps": 31, "total_steps": 93, "eval_loss": 0.43012088537216187, "epoch": 0.9763779527559056, "percentage": 33.33, "elapsed_time": "0:30:33", "remaining_time": "1:01:06"}
|
|
|
|
|
|
|
|
|
|
2 |
{"current_steps": 20, "total_steps": 93, "loss": 0.4778, "lr": 5e-06, "epoch": 0.6299212598425197, "percentage": 21.51, "elapsed_time": "0:19:16", "remaining_time": "1:10:20"}
|
3 |
{"current_steps": 30, "total_steps": 93, "loss": 0.4472, "lr": 5e-06, "epoch": 0.9448818897637795, "percentage": 32.26, "elapsed_time": "0:28:53", "remaining_time": "1:00:39"}
|
4 |
{"current_steps": 31, "total_steps": 93, "eval_loss": 0.43012088537216187, "epoch": 0.9763779527559056, "percentage": 33.33, "elapsed_time": "0:30:33", "remaining_time": "1:01:06"}
|
5 |
+
{"current_steps": 40, "total_steps": 93, "loss": 0.4667, "lr": 5e-06, "epoch": 1.279527559055118, "percentage": 43.01, "elapsed_time": "0:40:12", "remaining_time": "0:53:17"}
|
6 |
+
{"current_steps": 50, "total_steps": 93, "loss": 0.4113, "lr": 5e-06, "epoch": 1.594488188976378, "percentage": 53.76, "elapsed_time": "0:49:49", "remaining_time": "0:42:51"}
|
7 |
+
{"current_steps": 60, "total_steps": 93, "loss": 0.4167, "lr": 5e-06, "epoch": 1.909448818897638, "percentage": 64.52, "elapsed_time": "0:59:28", "remaining_time": "0:32:42"}
|
8 |
+
{"current_steps": 62, "total_steps": 93, "eval_loss": 0.4076673686504364, "epoch": 1.9724409448818898, "percentage": 66.67, "elapsed_time": "1:02:13", "remaining_time": "0:31:06"}
|