Training in progress, epoch 1
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4976698672
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ebbe14efe580784ef2d4a8d10c70ae1941a7481e531e14d86299a7db46b5ce3a
|
3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999802720
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bde40f127fb70ad4b2cce347d8e8efda6b8c51d0d5d925cba6b936f6910e8a58
|
3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4915916176
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fd281ac452aa1b0c543d92e0b78e8cff8976da44b829aabaf0727adabc941d15
|
3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1168138808
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e01304b587dd6f964fca04068c3ec50100379a2645a618a43038cf6c309f9b31
|
3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
@@ -4,3 +4,10 @@
|
|
4 |
{"current_steps": 40, "total_steps": 165, "loss": 0.6256, "lr": 5e-06, "epoch": 0.7223476297968398, "percentage": 24.24, "elapsed_time": "0:21:29", "remaining_time": "1:07:10"}
|
5 |
{"current_steps": 50, "total_steps": 165, "loss": 0.6154, "lr": 5e-06, "epoch": 0.9029345372460497, "percentage": 30.3, "elapsed_time": "0:26:48", "remaining_time": "1:01:39"}
|
6 |
{"current_steps": 55, "total_steps": 165, "eval_loss": 0.5993303656578064, "epoch": 0.9932279909706546, "percentage": 33.33, "elapsed_time": "0:30:18", "remaining_time": "1:00:36"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
4 |
{"current_steps": 40, "total_steps": 165, "loss": 0.6256, "lr": 5e-06, "epoch": 0.7223476297968398, "percentage": 24.24, "elapsed_time": "0:21:29", "remaining_time": "1:07:10"}
|
5 |
{"current_steps": 50, "total_steps": 165, "loss": 0.6154, "lr": 5e-06, "epoch": 0.9029345372460497, "percentage": 30.3, "elapsed_time": "0:26:48", "remaining_time": "1:01:39"}
|
6 |
{"current_steps": 55, "total_steps": 165, "eval_loss": 0.5993303656578064, "epoch": 0.9932279909706546, "percentage": 33.33, "elapsed_time": "0:30:18", "remaining_time": "1:00:36"}
|
7 |
+
{"current_steps": 60, "total_steps": 165, "loss": 0.6293, "lr": 5e-06, "epoch": 1.0835214446952597, "percentage": 36.36, "elapsed_time": "0:33:58", "remaining_time": "0:59:27"}
|
8 |
+
{"current_steps": 70, "total_steps": 165, "loss": 0.5656, "lr": 5e-06, "epoch": 1.2641083521444696, "percentage": 42.42, "elapsed_time": "0:39:17", "remaining_time": "0:53:20"}
|
9 |
+
{"current_steps": 80, "total_steps": 165, "loss": 0.5588, "lr": 5e-06, "epoch": 1.4446952595936795, "percentage": 48.48, "elapsed_time": "0:44:38", "remaining_time": "0:47:25"}
|
10 |
+
{"current_steps": 90, "total_steps": 165, "loss": 0.561, "lr": 5e-06, "epoch": 1.6252821670428894, "percentage": 54.55, "elapsed_time": "0:49:57", "remaining_time": "0:41:37"}
|
11 |
+
{"current_steps": 100, "total_steps": 165, "loss": 0.5526, "lr": 5e-06, "epoch": 1.8058690744920993, "percentage": 60.61, "elapsed_time": "0:55:15", "remaining_time": "0:35:54"}
|
12 |
+
{"current_steps": 110, "total_steps": 165, "loss": 0.5525, "lr": 5e-06, "epoch": 1.9864559819413092, "percentage": 66.67, "elapsed_time": "1:00:34", "remaining_time": "0:30:17"}
|
13 |
+
{"current_steps": 110, "total_steps": 165, "eval_loss": 0.5813493132591248, "epoch": 1.9864559819413092, "percentage": 66.67, "elapsed_time": "1:01:33", "remaining_time": "0:30:46"}
|