Training in progress, epoch 1
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4976698672
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6b23d3ca3908602b50aa3f2e6437da7f9b9c5f15fcb93761cac1773ec6485110
|
3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999802720
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4f2072b661188afb39f1a9aaed6501a64b560b8a78241138711796b26c86bfa3
|
3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4915916176
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b1435d48b76817b826795edf405c0fb0d41a885446c6bb8fd369e5bddf41863a
|
3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1168138808
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fce827aace0cf741f8c40211b94ebe325b401c473fd5259d51d2cbcfa2995fb1
|
3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
@@ -2,3 +2,7 @@
|
|
2 |
{"current_steps": 20, "total_steps": 93, "loss": 1.1085, "lr": 5e-06, "epoch": 0.64, "percentage": 21.51, "elapsed_time": "0:10:40", "remaining_time": "0:38:57"}
|
3 |
{"current_steps": 30, "total_steps": 93, "loss": 1.0621, "lr": 5e-06, "epoch": 0.96, "percentage": 32.26, "elapsed_time": "0:15:57", "remaining_time": "0:33:30"}
|
4 |
{"current_steps": 31, "total_steps": 93, "eval_loss": 1.0408542156219482, "epoch": 0.992, "percentage": 33.33, "elapsed_time": "0:16:59", "remaining_time": "0:33:59"}
|
|
|
|
|
|
|
|
|
|
2 |
{"current_steps": 20, "total_steps": 93, "loss": 1.1085, "lr": 5e-06, "epoch": 0.64, "percentage": 21.51, "elapsed_time": "0:10:40", "remaining_time": "0:38:57"}
|
3 |
{"current_steps": 30, "total_steps": 93, "loss": 1.0621, "lr": 5e-06, "epoch": 0.96, "percentage": 32.26, "elapsed_time": "0:15:57", "remaining_time": "0:33:30"}
|
4 |
{"current_steps": 31, "total_steps": 93, "eval_loss": 1.0408542156219482, "epoch": 0.992, "percentage": 33.33, "elapsed_time": "0:16:59", "remaining_time": "0:33:59"}
|
5 |
+
{"current_steps": 40, "total_steps": 93, "loss": 1.0841, "lr": 5e-06, "epoch": 1.28, "percentage": 43.01, "elapsed_time": "0:22:49", "remaining_time": "0:30:14"}
|
6 |
+
{"current_steps": 50, "total_steps": 93, "loss": 0.9873, "lr": 5e-06, "epoch": 1.6, "percentage": 53.76, "elapsed_time": "0:28:05", "remaining_time": "0:24:09"}
|
7 |
+
{"current_steps": 60, "total_steps": 93, "loss": 0.9711, "lr": 5e-06, "epoch": 1.92, "percentage": 64.52, "elapsed_time": "0:33:21", "remaining_time": "0:18:20"}
|
8 |
+
{"current_steps": 62, "total_steps": 93, "eval_loss": 0.9961642026901245, "epoch": 1.984, "percentage": 66.67, "elapsed_time": "0:35:00", "remaining_time": "0:17:30"}
|