Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4976698672
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:02e09101618d8a65bf5f323617ad060a20ce61b4f5e40cc64db678fe74fe4459
|
3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999802720
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:40a0d9d07beab43304dc7a979951d1019dac734c2125d450af7768d8d97efd0b
|
3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4915916176
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3640111d635af666a7005a8d4c5669beab90da72843de9d58daa19327a01936b
|
3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1168138808
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e086d638e2f23fb287685293ee9026ea34c7321e92d98612a10f4c82f4cc5e02
|
3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
@@ -13,3 +13,11 @@
|
|
13 |
{"current_steps": 120, "total_steps": 198, "loss": 0.6786, "lr": 5e-06, "epoch": 1.8045112781954886, "percentage": 60.61, "elapsed_time": "1:58:52", "remaining_time": "1:17:16"}
|
14 |
{"current_steps": 130, "total_steps": 198, "loss": 0.6668, "lr": 5e-06, "epoch": 1.954887218045113, "percentage": 65.66, "elapsed_time": "2:08:34", "remaining_time": "1:07:15"}
|
15 |
{"current_steps": 133, "total_steps": 198, "eval_loss": 0.7167445421218872, "epoch": 2.0, "percentage": 67.17, "elapsed_time": "2:12:35", "remaining_time": "1:04:48"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
13 |
{"current_steps": 120, "total_steps": 198, "loss": 0.6786, "lr": 5e-06, "epoch": 1.8045112781954886, "percentage": 60.61, "elapsed_time": "1:58:52", "remaining_time": "1:17:16"}
|
14 |
{"current_steps": 130, "total_steps": 198, "loss": 0.6668, "lr": 5e-06, "epoch": 1.954887218045113, "percentage": 65.66, "elapsed_time": "2:08:34", "remaining_time": "1:07:15"}
|
15 |
{"current_steps": 133, "total_steps": 198, "eval_loss": 0.7167445421218872, "epoch": 2.0, "percentage": 67.17, "elapsed_time": "2:12:35", "remaining_time": "1:04:48"}
|
16 |
+
{"current_steps": 140, "total_steps": 198, "loss": 0.6702, "lr": 5e-06, "epoch": 2.1052631578947367, "percentage": 70.71, "elapsed_time": "2:20:35", "remaining_time": "0:58:14"}
|
17 |
+
{"current_steps": 150, "total_steps": 198, "loss": 0.6221, "lr": 5e-06, "epoch": 2.255639097744361, "percentage": 75.76, "elapsed_time": "2:30:17", "remaining_time": "0:48:05"}
|
18 |
+
{"current_steps": 160, "total_steps": 198, "loss": 0.6227, "lr": 5e-06, "epoch": 2.406015037593985, "percentage": 80.81, "elapsed_time": "2:40:00", "remaining_time": "0:38:00"}
|
19 |
+
{"current_steps": 170, "total_steps": 198, "loss": 0.625, "lr": 5e-06, "epoch": 2.556390977443609, "percentage": 85.86, "elapsed_time": "2:49:44", "remaining_time": "0:27:57"}
|
20 |
+
{"current_steps": 180, "total_steps": 198, "loss": 0.6189, "lr": 5e-06, "epoch": 2.706766917293233, "percentage": 90.91, "elapsed_time": "2:59:28", "remaining_time": "0:17:56"}
|
21 |
+
{"current_steps": 190, "total_steps": 198, "loss": 0.6284, "lr": 5e-06, "epoch": 2.857142857142857, "percentage": 95.96, "elapsed_time": "3:09:12", "remaining_time": "0:07:57"}
|
22 |
+
{"current_steps": 198, "total_steps": 198, "eval_loss": 0.7185549139976501, "epoch": 2.9774436090225564, "percentage": 100.0, "elapsed_time": "3:19:23", "remaining_time": "0:00:00"}
|
23 |
+
{"current_steps": 198, "total_steps": 198, "epoch": 2.9774436090225564, "percentage": 100.0, "elapsed_time": "3:20:39", "remaining_time": "0:00:00"}
|