Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4976698672
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b8fe19691e4a35c0142886245a9c9d6c76bfcf8ff3be2aaf6dccb22b5f715832
|
3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999802720
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1b34086a26530b212468d4b9a2acc82e75322af97b706898950ec64d16ab5cb5
|
3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4915916176
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:53aedb5a0be2a86e8dcf4d601e2bd9d0b03629b2ad71e8bfceacd6ce9d392e50
|
3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1168138808
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fd57f1868de4b0c74b45315de3db4d764b40994450931c21cb09d2fc839990b9
|
3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
@@ -40,3 +40,23 @@
|
|
40 |
{"current_steps": 390, "total_steps": 600, "loss": 0.7478, "lr": 5e-06, "epoch": 1.947565543071161, "percentage": 65.0, "elapsed_time": "6:18:18", "remaining_time": "3:23:42"}
|
41 |
{"current_steps": 400, "total_steps": 600, "loss": 0.7538, "lr": 5e-06, "epoch": 1.9975031210986267, "percentage": 66.67, "elapsed_time": "6:27:52", "remaining_time": "3:13:56"}
|
42 |
{"current_steps": 400, "total_steps": 600, "eval_loss": 0.7874204516410828, "epoch": 1.9975031210986267, "percentage": 66.67, "elapsed_time": "6:31:51", "remaining_time": "3:15:55"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
40 |
{"current_steps": 390, "total_steps": 600, "loss": 0.7478, "lr": 5e-06, "epoch": 1.947565543071161, "percentage": 65.0, "elapsed_time": "6:18:18", "remaining_time": "3:23:42"}
|
41 |
{"current_steps": 400, "total_steps": 600, "loss": 0.7538, "lr": 5e-06, "epoch": 1.9975031210986267, "percentage": 66.67, "elapsed_time": "6:27:52", "remaining_time": "3:13:56"}
|
42 |
{"current_steps": 400, "total_steps": 600, "eval_loss": 0.7874204516410828, "epoch": 1.9975031210986267, "percentage": 66.67, "elapsed_time": "6:31:51", "remaining_time": "3:15:55"}
|
43 |
+
{"current_steps": 410, "total_steps": 600, "loss": 0.7611, "lr": 5e-06, "epoch": 2.0474406991260925, "percentage": 68.33, "elapsed_time": "6:42:13", "remaining_time": "3:06:23"}
|
44 |
+
{"current_steps": 420, "total_steps": 600, "loss": 0.7037, "lr": 5e-06, "epoch": 2.097378277153558, "percentage": 70.0, "elapsed_time": "6:51:48", "remaining_time": "2:56:29"}
|
45 |
+
{"current_steps": 430, "total_steps": 600, "loss": 0.7089, "lr": 5e-06, "epoch": 2.1473158551810236, "percentage": 71.67, "elapsed_time": "7:01:22", "remaining_time": "2:46:35"}
|
46 |
+
{"current_steps": 440, "total_steps": 600, "loss": 0.7057, "lr": 5e-06, "epoch": 2.1972534332084894, "percentage": 73.33, "elapsed_time": "7:10:58", "remaining_time": "2:36:43"}
|
47 |
+
{"current_steps": 450, "total_steps": 600, "loss": 0.706, "lr": 5e-06, "epoch": 2.247191011235955, "percentage": 75.0, "elapsed_time": "7:20:32", "remaining_time": "2:26:50"}
|
48 |
+
{"current_steps": 460, "total_steps": 600, "loss": 0.7064, "lr": 5e-06, "epoch": 2.2971285892634206, "percentage": 76.67, "elapsed_time": "7:30:07", "remaining_time": "2:16:59"}
|
49 |
+
{"current_steps": 470, "total_steps": 600, "loss": 0.7049, "lr": 5e-06, "epoch": 2.3470661672908864, "percentage": 78.33, "elapsed_time": "7:39:41", "remaining_time": "2:07:08"}
|
50 |
+
{"current_steps": 480, "total_steps": 600, "loss": 0.705, "lr": 5e-06, "epoch": 2.397003745318352, "percentage": 80.0, "elapsed_time": "7:49:16", "remaining_time": "1:57:19"}
|
51 |
+
{"current_steps": 490, "total_steps": 600, "loss": 0.709, "lr": 5e-06, "epoch": 2.4469413233458175, "percentage": 81.67, "elapsed_time": "7:58:51", "remaining_time": "1:47:29"}
|
52 |
+
{"current_steps": 500, "total_steps": 600, "loss": 0.71, "lr": 5e-06, "epoch": 2.4968789013732833, "percentage": 83.33, "elapsed_time": "8:08:27", "remaining_time": "1:37:41"}
|
53 |
+
{"current_steps": 510, "total_steps": 600, "loss": 0.7128, "lr": 5e-06, "epoch": 2.546816479400749, "percentage": 85.0, "elapsed_time": "8:18:02", "remaining_time": "1:27:53"}
|
54 |
+
{"current_steps": 520, "total_steps": 600, "loss": 0.7116, "lr": 5e-06, "epoch": 2.596754057428215, "percentage": 86.67, "elapsed_time": "8:27:37", "remaining_time": "1:18:05"}
|
55 |
+
{"current_steps": 530, "total_steps": 600, "loss": 0.711, "lr": 5e-06, "epoch": 2.6466916354556806, "percentage": 88.33, "elapsed_time": "8:37:14", "remaining_time": "1:08:18"}
|
56 |
+
{"current_steps": 540, "total_steps": 600, "loss": 0.706, "lr": 5e-06, "epoch": 2.696629213483146, "percentage": 90.0, "elapsed_time": "8:46:49", "remaining_time": "0:58:32"}
|
57 |
+
{"current_steps": 550, "total_steps": 600, "loss": 0.7144, "lr": 5e-06, "epoch": 2.746566791510612, "percentage": 91.67, "elapsed_time": "8:56:25", "remaining_time": "0:48:45"}
|
58 |
+
{"current_steps": 560, "total_steps": 600, "loss": 0.708, "lr": 5e-06, "epoch": 2.796504369538077, "percentage": 93.33, "elapsed_time": "9:06:01", "remaining_time": "0:39:00"}
|
59 |
+
{"current_steps": 570, "total_steps": 600, "loss": 0.7147, "lr": 5e-06, "epoch": 2.846441947565543, "percentage": 95.0, "elapsed_time": "9:15:36", "remaining_time": "0:29:14"}
|
60 |
+
{"current_steps": 580, "total_steps": 600, "loss": 0.7114, "lr": 5e-06, "epoch": 2.8963795255930087, "percentage": 96.67, "elapsed_time": "9:25:12", "remaining_time": "0:19:29"}
|
61 |
+
{"current_steps": 590, "total_steps": 600, "loss": 0.7072, "lr": 5e-06, "epoch": 2.9463171036204745, "percentage": 98.33, "elapsed_time": "9:34:47", "remaining_time": "0:09:44"}
|
62 |
+
{"current_steps": 600, "total_steps": 600, "loss": 0.7158, "lr": 5e-06, "epoch": 2.9962546816479403, "percentage": 100.0, "elapsed_time": "9:44:23", "remaining_time": "0:00:00"}
|