Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4976698672
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:002d107608c7826a92d5ae8fce67a4f6e5aa8a0f467166212b8ba266aac65849
|
3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999802720
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9a2e9bf29c7ae4e21d29a444d37b6d25cba22b6956008a2d8f62b205eca22b26
|
3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4915916176
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:71bdd312318a4e8be7a1364cc8f1a3ca4737c15ac2006ddac7e0ec9431a7cd0a
|
3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1168138808
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:453419b7857ca38e1a81dec44c26dd0a4122bace0875f6271e643bd72668b555
|
3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
@@ -11,3 +11,10 @@
|
|
11 |
{"current_steps": 100, "total_steps": 165, "loss": 0.5526, "lr": 5e-06, "epoch": 1.8058690744920993, "percentage": 60.61, "elapsed_time": "0:55:15", "remaining_time": "0:35:54"}
|
12 |
{"current_steps": 110, "total_steps": 165, "loss": 0.5525, "lr": 5e-06, "epoch": 1.9864559819413092, "percentage": 66.67, "elapsed_time": "1:00:34", "remaining_time": "0:30:17"}
|
13 |
{"current_steps": 110, "total_steps": 165, "eval_loss": 0.5813493132591248, "epoch": 1.9864559819413092, "percentage": 66.67, "elapsed_time": "1:01:33", "remaining_time": "0:30:46"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
11 |
{"current_steps": 100, "total_steps": 165, "loss": 0.5526, "lr": 5e-06, "epoch": 1.8058690744920993, "percentage": 60.61, "elapsed_time": "0:55:15", "remaining_time": "0:35:54"}
|
12 |
{"current_steps": 110, "total_steps": 165, "loss": 0.5525, "lr": 5e-06, "epoch": 1.9864559819413092, "percentage": 66.67, "elapsed_time": "1:00:34", "remaining_time": "0:30:17"}
|
13 |
{"current_steps": 110, "total_steps": 165, "eval_loss": 0.5813493132591248, "epoch": 1.9864559819413092, "percentage": 66.67, "elapsed_time": "1:01:33", "remaining_time": "0:30:46"}
|
14 |
+
{"current_steps": 120, "total_steps": 165, "loss": 0.549, "lr": 5e-06, "epoch": 2.1670428893905194, "percentage": 72.73, "elapsed_time": "1:07:49", "remaining_time": "0:25:26"}
|
15 |
+
{"current_steps": 130, "total_steps": 165, "loss": 0.5085, "lr": 5e-06, "epoch": 2.3476297968397293, "percentage": 78.79, "elapsed_time": "1:13:11", "remaining_time": "0:19:42"}
|
16 |
+
{"current_steps": 140, "total_steps": 165, "loss": 0.5079, "lr": 5e-06, "epoch": 2.528216704288939, "percentage": 84.85, "elapsed_time": "1:18:32", "remaining_time": "0:14:01"}
|
17 |
+
{"current_steps": 150, "total_steps": 165, "loss": 0.5073, "lr": 5e-06, "epoch": 2.708803611738149, "percentage": 90.91, "elapsed_time": "1:23:54", "remaining_time": "0:08:23"}
|
18 |
+
{"current_steps": 160, "total_steps": 165, "loss": 0.5138, "lr": 5e-06, "epoch": 2.889390519187359, "percentage": 96.97, "elapsed_time": "1:29:15", "remaining_time": "0:02:47"}
|
19 |
+
{"current_steps": 165, "total_steps": 165, "eval_loss": 0.5825901627540588, "epoch": 2.979683972911964, "percentage": 100.0, "elapsed_time": "1:33:52", "remaining_time": "0:00:00"}
|
20 |
+
{"current_steps": 165, "total_steps": 165, "epoch": 2.979683972911964, "percentage": 100.0, "elapsed_time": "1:35:05", "remaining_time": "0:00:00"}
|