Training in progress, epoch 1
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4976698672
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:10f40044d7b17ce24f62f6ce38c85841b8bf8ab6a6c3194b5fb62615602e69dd
|
3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999802720
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:88213520c000e5588cf74d852d57c164dc098609594b8a3cb88cf0ef2fcd9ad3
|
3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4915916176
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:70ee644f4419a50d381d2031d9e3df55ded715ec2fb4675c4f87db0c933c6b7b
|
3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1168138808
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4817076e908f5e38543e99e3ca023a71c6ecd39c27df2e9f8dec38ac03d8c20c
|
3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
@@ -2,3 +2,8 @@
|
|
2 |
{"current_steps": 20, "total_steps": 108, "loss": 0.9352, "lr": 5e-06, "epoch": 0.5517241379310345, "percentage": 18.52, "elapsed_time": "0:51:59", "remaining_time": "3:48:44"}
|
3 |
{"current_steps": 30, "total_steps": 108, "loss": 0.8976, "lr": 5e-06, "epoch": 0.8275862068965517, "percentage": 27.78, "elapsed_time": "1:17:57", "remaining_time": "3:22:40"}
|
4 |
{"current_steps": 36, "total_steps": 108, "eval_loss": 0.8847346901893616, "epoch": 0.993103448275862, "percentage": 33.33, "elapsed_time": "1:36:09", "remaining_time": "3:12:19"}
|
|
|
|
|
|
|
|
|
|
|
|
2 |
{"current_steps": 20, "total_steps": 108, "loss": 0.9352, "lr": 5e-06, "epoch": 0.5517241379310345, "percentage": 18.52, "elapsed_time": "0:51:59", "remaining_time": "3:48:44"}
|
3 |
{"current_steps": 30, "total_steps": 108, "loss": 0.8976, "lr": 5e-06, "epoch": 0.8275862068965517, "percentage": 27.78, "elapsed_time": "1:17:57", "remaining_time": "3:22:40"}
|
4 |
{"current_steps": 36, "total_steps": 108, "eval_loss": 0.8847346901893616, "epoch": 0.993103448275862, "percentage": 33.33, "elapsed_time": "1:36:09", "remaining_time": "3:12:19"}
|
5 |
+
{"current_steps": 40, "total_steps": 108, "loss": 0.8669, "lr": 5e-06, "epoch": 1.103448275862069, "percentage": 37.04, "elapsed_time": "1:47:22", "remaining_time": "3:02:32"}
|
6 |
+
{"current_steps": 50, "total_steps": 108, "loss": 0.832, "lr": 5e-06, "epoch": 1.3793103448275863, "percentage": 46.3, "elapsed_time": "2:13:18", "remaining_time": "2:34:38"}
|
7 |
+
{"current_steps": 60, "total_steps": 108, "loss": 0.8196, "lr": 5e-06, "epoch": 1.6551724137931034, "percentage": 55.56, "elapsed_time": "2:39:13", "remaining_time": "2:07:23"}
|
8 |
+
{"current_steps": 70, "total_steps": 108, "loss": 0.8134, "lr": 5e-06, "epoch": 1.9310344827586206, "percentage": 64.81, "elapsed_time": "3:05:08", "remaining_time": "1:40:30"}
|
9 |
+
{"current_steps": 72, "total_steps": 108, "eval_loss": 0.8555252552032471, "epoch": 1.986206896551724, "percentage": 66.67, "elapsed_time": "3:13:30", "remaining_time": "1:36:45"}
|