Training in progress, epoch 3
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4976698672
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2279fe66849158fb64c40d3eb08e49a75b50c07246a5a462fef74c738752aa50
|
3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999802720
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e99976b48e522006f40fd4d146546d4a6ecf5e24da95e5b44f9fa833c01211f0
|
3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4915916176
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a803a85980fc6c9c5aed172005bfa752f771c5e179ca4612b4068c32ef67dd4a
|
3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1168138808
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:113bb9aa3a2605e915daa8a2fa9a1a237077a4f1167e19d49d6ea205bc049a7e
|
3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
@@ -8,3 +8,8 @@
|
|
8 |
{"current_steps": 70, "total_steps": 117, "loss": 0.4657, "lr": 5e-06, "epoch": 1.7948717948717947, "percentage": 59.83, "elapsed_time": "1:08:59", "remaining_time": "0:46:19"}
|
9 |
{"current_steps": 78, "total_steps": 117, "eval_loss": 0.48121070861816406, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "1:17:21", "remaining_time": "0:38:40"}
|
10 |
{"current_steps": 80, "total_steps": 117, "loss": 0.4509, "lr": 5e-06, "epoch": 2.051282051282051, "percentage": 68.38, "elapsed_time": "1:20:27", "remaining_time": "0:37:12"}
|
|
|
|
|
|
|
|
|
|
|
|
8 |
{"current_steps": 70, "total_steps": 117, "loss": 0.4657, "lr": 5e-06, "epoch": 1.7948717948717947, "percentage": 59.83, "elapsed_time": "1:08:59", "remaining_time": "0:46:19"}
|
9 |
{"current_steps": 78, "total_steps": 117, "eval_loss": 0.48121070861816406, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "1:17:21", "remaining_time": "0:38:40"}
|
10 |
{"current_steps": 80, "total_steps": 117, "loss": 0.4509, "lr": 5e-06, "epoch": 2.051282051282051, "percentage": 68.38, "elapsed_time": "1:20:27", "remaining_time": "0:37:12"}
|
11 |
+
{"current_steps": 90, "total_steps": 117, "loss": 0.4352, "lr": 5e-06, "epoch": 2.3076923076923075, "percentage": 76.92, "elapsed_time": "1:30:03", "remaining_time": "0:27:01"}
|
12 |
+
{"current_steps": 100, "total_steps": 117, "loss": 0.4268, "lr": 5e-06, "epoch": 2.564102564102564, "percentage": 85.47, "elapsed_time": "1:39:40", "remaining_time": "0:16:56"}
|
13 |
+
{"current_steps": 110, "total_steps": 117, "loss": 0.4298, "lr": 5e-06, "epoch": 2.8205128205128203, "percentage": 94.02, "elapsed_time": "1:49:16", "remaining_time": "0:06:57"}
|
14 |
+
{"current_steps": 117, "total_steps": 117, "eval_loss": 0.4801027178764343, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "1:57:53", "remaining_time": "0:00:00"}
|
15 |
+
{"current_steps": 117, "total_steps": 117, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "1:59:07", "remaining_time": "0:00:00"}
|