Training in progress, epoch 3
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4976698672
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b5e6a5e0618d3a3acdfac4fd91a62f411e699007ab38bacbe7bbefa76a72ad22
|
3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999802720
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:91dd3b85dd05b3caa81d1a98a290b257589ecd2c6e33080dcc862caf572a43ac
|
3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4915916176
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f27b08b9dd7e1fe42cda95a25c0ac4fd8b73aab5af0aef5325f47c34f537091d
|
3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1168138808
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9266dd59e94e0c04302fd8a5f884675c67b8162d09d22dff5732314377716358
|
3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
@@ -57,3 +57,30 @@
|
|
57 |
{"current_steps": 550, "total_steps": 822, "loss": 0.6708, "learning_rate": 5e-06, "epoch": 2.0072992700729926, "percentage": 66.91, "elapsed_time": "0:58:10", "remaining_time": "0:28:46"}
|
58 |
{"current_steps": 560, "total_steps": 822, "loss": 0.6358, "learning_rate": 5e-06, "epoch": 2.0437956204379564, "percentage": 68.13, "elapsed_time": "0:59:08", "remaining_time": "0:27:40"}
|
59 |
{"current_steps": 570, "total_steps": 822, "loss": 0.6306, "learning_rate": 5e-06, "epoch": 2.0802919708029197, "percentage": 69.34, "elapsed_time": "1:00:06", "remaining_time": "0:26:34"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
57 |
{"current_steps": 550, "total_steps": 822, "loss": 0.6708, "learning_rate": 5e-06, "epoch": 2.0072992700729926, "percentage": 66.91, "elapsed_time": "0:58:10", "remaining_time": "0:28:46"}
|
58 |
{"current_steps": 560, "total_steps": 822, "loss": 0.6358, "learning_rate": 5e-06, "epoch": 2.0437956204379564, "percentage": 68.13, "elapsed_time": "0:59:08", "remaining_time": "0:27:40"}
|
59 |
{"current_steps": 570, "total_steps": 822, "loss": 0.6306, "learning_rate": 5e-06, "epoch": 2.0802919708029197, "percentage": 69.34, "elapsed_time": "1:00:06", "remaining_time": "0:26:34"}
|
60 |
+
{"current_steps": 580, "total_steps": 822, "loss": 0.6289, "learning_rate": 5e-06, "epoch": 2.116788321167883, "percentage": 70.56, "elapsed_time": "1:01:04", "remaining_time": "0:25:29"}
|
61 |
+
{"current_steps": 590, "total_steps": 822, "loss": 0.6303, "learning_rate": 5e-06, "epoch": 2.153284671532847, "percentage": 71.78, "elapsed_time": "1:02:02", "remaining_time": "0:24:23"}
|
62 |
+
{"current_steps": 600, "total_steps": 822, "loss": 0.6291, "learning_rate": 5e-06, "epoch": 2.18978102189781, "percentage": 72.99, "elapsed_time": "1:03:01", "remaining_time": "0:23:19"}
|
63 |
+
{"current_steps": 610, "total_steps": 822, "loss": 0.6266, "learning_rate": 5e-06, "epoch": 2.2262773722627736, "percentage": 74.21, "elapsed_time": "1:03:59", "remaining_time": "0:22:14"}
|
64 |
+
{"current_steps": 620, "total_steps": 822, "loss": 0.6316, "learning_rate": 5e-06, "epoch": 2.2627737226277373, "percentage": 75.43, "elapsed_time": "1:04:57", "remaining_time": "0:21:09"}
|
65 |
+
{"current_steps": 630, "total_steps": 822, "loss": 0.6324, "learning_rate": 5e-06, "epoch": 2.2992700729927007, "percentage": 76.64, "elapsed_time": "1:05:55", "remaining_time": "0:20:05"}
|
66 |
+
{"current_steps": 640, "total_steps": 822, "loss": 0.6276, "learning_rate": 5e-06, "epoch": 2.335766423357664, "percentage": 77.86, "elapsed_time": "1:06:54", "remaining_time": "0:19:01"}
|
67 |
+
{"current_steps": 650, "total_steps": 822, "loss": 0.6376, "learning_rate": 5e-06, "epoch": 2.372262773722628, "percentage": 79.08, "elapsed_time": "1:07:52", "remaining_time": "0:17:57"}
|
68 |
+
{"current_steps": 660, "total_steps": 822, "loss": 0.6287, "learning_rate": 5e-06, "epoch": 2.408759124087591, "percentage": 80.29, "elapsed_time": "1:08:50", "remaining_time": "0:16:53"}
|
69 |
+
{"current_steps": 670, "total_steps": 822, "loss": 0.6355, "learning_rate": 5e-06, "epoch": 2.445255474452555, "percentage": 81.51, "elapsed_time": "1:09:48", "remaining_time": "0:15:50"}
|
70 |
+
{"current_steps": 680, "total_steps": 822, "loss": 0.6361, "learning_rate": 5e-06, "epoch": 2.4817518248175183, "percentage": 82.73, "elapsed_time": "1:10:46", "remaining_time": "0:14:46"}
|
71 |
+
{"current_steps": 690, "total_steps": 822, "loss": 0.6377, "learning_rate": 5e-06, "epoch": 2.5182481751824817, "percentage": 83.94, "elapsed_time": "1:11:45", "remaining_time": "0:13:43"}
|
72 |
+
{"current_steps": 700, "total_steps": 822, "loss": 0.6348, "learning_rate": 5e-06, "epoch": 2.554744525547445, "percentage": 85.16, "elapsed_time": "1:12:43", "remaining_time": "0:12:40"}
|
73 |
+
{"current_steps": 710, "total_steps": 822, "loss": 0.6409, "learning_rate": 5e-06, "epoch": 2.591240875912409, "percentage": 86.37, "elapsed_time": "1:13:41", "remaining_time": "0:11:37"}
|
74 |
+
{"current_steps": 720, "total_steps": 822, "loss": 0.6295, "learning_rate": 5e-06, "epoch": 2.627737226277372, "percentage": 87.59, "elapsed_time": "1:14:39", "remaining_time": "0:10:34"}
|
75 |
+
{"current_steps": 730, "total_steps": 822, "loss": 0.6353, "learning_rate": 5e-06, "epoch": 2.664233576642336, "percentage": 88.81, "elapsed_time": "1:15:37", "remaining_time": "0:09:31"}
|
76 |
+
{"current_steps": 740, "total_steps": 822, "loss": 0.6363, "learning_rate": 5e-06, "epoch": 2.7007299270072993, "percentage": 90.02, "elapsed_time": "1:16:36", "remaining_time": "0:08:29"}
|
77 |
+
{"current_steps": 750, "total_steps": 822, "loss": 0.6349, "learning_rate": 5e-06, "epoch": 2.7372262773722627, "percentage": 91.24, "elapsed_time": "1:17:34", "remaining_time": "0:07:26"}
|
78 |
+
{"current_steps": 760, "total_steps": 822, "loss": 0.6407, "learning_rate": 5e-06, "epoch": 2.7737226277372264, "percentage": 92.46, "elapsed_time": "1:18:32", "remaining_time": "0:06:24"}
|
79 |
+
{"current_steps": 770, "total_steps": 822, "loss": 0.631, "learning_rate": 5e-06, "epoch": 2.81021897810219, "percentage": 93.67, "elapsed_time": "1:19:30", "remaining_time": "0:05:22"}
|
80 |
+
{"current_steps": 780, "total_steps": 822, "loss": 0.6298, "learning_rate": 5e-06, "epoch": 2.846715328467153, "percentage": 94.89, "elapsed_time": "1:20:28", "remaining_time": "0:04:20"}
|
81 |
+
{"current_steps": 790, "total_steps": 822, "loss": 0.6325, "learning_rate": 5e-06, "epoch": 2.883211678832117, "percentage": 96.11, "elapsed_time": "1:21:27", "remaining_time": "0:03:17"}
|
82 |
+
{"current_steps": 800, "total_steps": 822, "loss": 0.6425, "learning_rate": 5e-06, "epoch": 2.9197080291970803, "percentage": 97.32, "elapsed_time": "1:22:25", "remaining_time": "0:02:15"}
|
83 |
+
{"current_steps": 810, "total_steps": 822, "loss": 0.6323, "learning_rate": 5e-06, "epoch": 2.9562043795620436, "percentage": 98.54, "elapsed_time": "1:23:23", "remaining_time": "0:01:14"}
|
84 |
+
{"current_steps": 820, "total_steps": 822, "loss": 0.6383, "learning_rate": 5e-06, "epoch": 2.9927007299270074, "percentage": 99.76, "elapsed_time": "1:24:21", "remaining_time": "0:00:12"}
|
85 |
+
{"current_steps": 822, "total_steps": 822, "eval_loss": 0.7370563745498657, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "1:26:35", "remaining_time": "0:00:00"}
|
86 |
+
{"current_steps": 822, "total_steps": 822, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "1:28:03", "remaining_time": "0:00:00"}
|