Training in progress, epoch 3
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4976698672
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4b0b5175b6a6b9ad16bfd112c64593e5045467539873c235b6b63dffa4825faf
|
3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999802720
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b7b4440dd2c3e05b2345f5a053f9c0f4c1374a371368d01a989144772de7d031
|
3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4915916176
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1a4a7cfe98706a690663577ae16aa276360950389536835f504d6492f6a8c4df
|
3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1168138808
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ab2f6de02a913adafd867ce7e80dd0df8e63afe4eaf60870c81ee98bab0e36e7
|
3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
@@ -121,3 +121,12 @@
|
|
121 |
{"current_steps": 1190, "total_steps": 1281, "loss": 0.4704, "lr": 5e-06, "epoch": 2.7868852459016393, "percentage": 92.9, "elapsed_time": "2:02:11", "remaining_time": "0:09:20"}
|
122 |
{"current_steps": 1200, "total_steps": 1281, "loss": 0.4707, "lr": 5e-06, "epoch": 2.810304449648712, "percentage": 93.68, "elapsed_time": "2:03:11", "remaining_time": "0:08:18"}
|
123 |
{"current_steps": 1210, "total_steps": 1281, "loss": 0.4679, "lr": 5e-06, "epoch": 2.8337236533957846, "percentage": 94.46, "elapsed_time": "2:04:10", "remaining_time": "0:07:17"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
121 |
{"current_steps": 1190, "total_steps": 1281, "loss": 0.4704, "lr": 5e-06, "epoch": 2.7868852459016393, "percentage": 92.9, "elapsed_time": "2:02:11", "remaining_time": "0:09:20"}
|
122 |
{"current_steps": 1200, "total_steps": 1281, "loss": 0.4707, "lr": 5e-06, "epoch": 2.810304449648712, "percentage": 93.68, "elapsed_time": "2:03:11", "remaining_time": "0:08:18"}
|
123 |
{"current_steps": 1210, "total_steps": 1281, "loss": 0.4679, "lr": 5e-06, "epoch": 2.8337236533957846, "percentage": 94.46, "elapsed_time": "2:04:10", "remaining_time": "0:07:17"}
|
124 |
+
{"current_steps": 1220, "total_steps": 1281, "loss": 0.4711, "lr": 5e-06, "epoch": 2.857142857142857, "percentage": 95.24, "elapsed_time": "2:05:09", "remaining_time": "0:06:15"}
|
125 |
+
{"current_steps": 1230, "total_steps": 1281, "loss": 0.4653, "lr": 5e-06, "epoch": 2.88056206088993, "percentage": 96.02, "elapsed_time": "2:06:08", "remaining_time": "0:05:13"}
|
126 |
+
{"current_steps": 1240, "total_steps": 1281, "loss": 0.4667, "lr": 5e-06, "epoch": 2.9039812646370025, "percentage": 96.8, "elapsed_time": "2:07:08", "remaining_time": "0:04:12"}
|
127 |
+
{"current_steps": 1250, "total_steps": 1281, "loss": 0.4664, "lr": 5e-06, "epoch": 2.927400468384075, "percentage": 97.58, "elapsed_time": "2:08:08", "remaining_time": "0:03:10"}
|
128 |
+
{"current_steps": 1260, "total_steps": 1281, "loss": 0.468, "lr": 5e-06, "epoch": 2.9508196721311473, "percentage": 98.36, "elapsed_time": "2:09:09", "remaining_time": "0:02:09"}
|
129 |
+
{"current_steps": 1270, "total_steps": 1281, "loss": 0.4654, "lr": 5e-06, "epoch": 2.9742388758782203, "percentage": 99.14, "elapsed_time": "2:10:09", "remaining_time": "0:01:07"}
|
130 |
+
{"current_steps": 1280, "total_steps": 1281, "loss": 0.47, "lr": 5e-06, "epoch": 2.9976580796252925, "percentage": 99.92, "elapsed_time": "2:11:08", "remaining_time": "0:00:06"}
|
131 |
+
{"current_steps": 1281, "total_steps": 1281, "eval_loss": 0.5069288611412048, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "2:13:48", "remaining_time": "0:00:00"}
|
132 |
+
{"current_steps": 1281, "total_steps": 1281, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "2:15:16", "remaining_time": "0:00:00"}
|