Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4976698672
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0f3dad0a26aea98709f4868c9d9f791d25b61b94cee3bed41983db7822afb93a
|
3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999802720
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7d2760249711ebf5e9dcd4e9df10a3776769493c14ea2b70a9123ae1b8cba2a7
|
3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4915916176
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:919997a6ee7e79f6f144f19cbe4577a08c0106c47646515d648224354eb1a15c
|
3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1168138808
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8beb3db21848b4254d2e32b46ee1cf963972d726cc1dc66fe9337d141eec07e0
|
3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
@@ -10,3 +10,10 @@
|
|
10 |
{"current_steps": 90, "total_steps": 150, "loss": 0.5397, "lr": 5e-06, "epoch": 1.7955112219451372, "percentage": 60.0, "elapsed_time": "1:26:57", "remaining_time": "0:57:58"}
|
11 |
{"current_steps": 100, "total_steps": 150, "loss": 0.5438, "lr": 5e-06, "epoch": 1.9950124688279303, "percentage": 66.67, "elapsed_time": "1:36:23", "remaining_time": "0:48:11"}
|
12 |
{"current_steps": 100, "total_steps": 150, "eval_loss": 0.5740869641304016, "epoch": 1.9950124688279303, "percentage": 66.67, "elapsed_time": "1:37:29", "remaining_time": "0:48:44"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
10 |
{"current_steps": 90, "total_steps": 150, "loss": 0.5397, "lr": 5e-06, "epoch": 1.7955112219451372, "percentage": 60.0, "elapsed_time": "1:26:57", "remaining_time": "0:57:58"}
|
11 |
{"current_steps": 100, "total_steps": 150, "loss": 0.5438, "lr": 5e-06, "epoch": 1.9950124688279303, "percentage": 66.67, "elapsed_time": "1:36:23", "remaining_time": "0:48:11"}
|
12 |
{"current_steps": 100, "total_steps": 150, "eval_loss": 0.5740869641304016, "epoch": 1.9950124688279303, "percentage": 66.67, "elapsed_time": "1:37:29", "remaining_time": "0:48:44"}
|
13 |
+
{"current_steps": 110, "total_steps": 150, "loss": 0.5407, "lr": 5e-06, "epoch": 2.1945137157107233, "percentage": 73.33, "elapsed_time": "1:47:51", "remaining_time": "0:39:13"}
|
14 |
+
{"current_steps": 120, "total_steps": 150, "loss": 0.4996, "lr": 5e-06, "epoch": 2.3940149625935163, "percentage": 80.0, "elapsed_time": "1:57:16", "remaining_time": "0:29:19"}
|
15 |
+
{"current_steps": 130, "total_steps": 150, "loss": 0.4972, "lr": 5e-06, "epoch": 2.5935162094763093, "percentage": 86.67, "elapsed_time": "2:06:44", "remaining_time": "0:19:29"}
|
16 |
+
{"current_steps": 140, "total_steps": 150, "loss": 0.4926, "lr": 5e-06, "epoch": 2.7930174563591024, "percentage": 93.33, "elapsed_time": "2:16:11", "remaining_time": "0:09:43"}
|
17 |
+
{"current_steps": 150, "total_steps": 150, "loss": 0.4952, "lr": 5e-06, "epoch": 2.9925187032418954, "percentage": 100.0, "elapsed_time": "2:25:37", "remaining_time": "0:00:00"}
|
18 |
+
{"current_steps": 150, "total_steps": 150, "eval_loss": 0.5672302842140198, "epoch": 2.9925187032418954, "percentage": 100.0, "elapsed_time": "2:27:42", "remaining_time": "0:00:00"}
|
19 |
+
{"current_steps": 150, "total_steps": 150, "epoch": 2.9925187032418954, "percentage": 100.0, "elapsed_time": "2:28:56", "remaining_time": "0:00:00"}
|