Training in progress, epoch 1
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4976698672
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b7eed145ab81aee983cf736774b464b0e064114f1552a8e2b69c4f7fc46114f
|
3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999802720
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:09db305b1406b3eb8361900bdac92f2cca92831cf6ed6f7fb088ffe294f37c17
|
3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4915916176
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2555567f03757165752020cfb88c034609ab12124095ab0e912d73ccaaea7b07
|
3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1168138808
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7a7529c2b70f47e0793e27b44ef69c308b9c4efa18d512289f98c10174652184
|
3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
@@ -1,3 +1,6 @@
|
|
1 |
{"current_steps": 10, "total_steps": 54, "loss": 1.1508, "lr": 5e-06, "epoch": 0.5298013245033113, "percentage": 18.52, "elapsed_time": "0:05:26", "remaining_time": "0:23:54"}
|
2 |
{"current_steps": 18, "total_steps": 54, "eval_loss": 1.0110349655151367, "epoch": 0.9536423841059603, "percentage": 33.33, "elapsed_time": "0:10:13", "remaining_time": "0:20:26"}
|
3 |
{"current_steps": 20, "total_steps": 54, "loss": 1.0692, "lr": 5e-06, "epoch": 1.0728476821192052, "percentage": 37.04, "elapsed_time": "0:12:11", "remaining_time": "0:20:43"}
|
|
|
|
|
|
|
|
1 |
{"current_steps": 10, "total_steps": 54, "loss": 1.1508, "lr": 5e-06, "epoch": 0.5298013245033113, "percentage": 18.52, "elapsed_time": "0:05:26", "remaining_time": "0:23:54"}
|
2 |
{"current_steps": 18, "total_steps": 54, "eval_loss": 1.0110349655151367, "epoch": 0.9536423841059603, "percentage": 33.33, "elapsed_time": "0:10:13", "remaining_time": "0:20:26"}
|
3 |
{"current_steps": 20, "total_steps": 54, "loss": 1.0692, "lr": 5e-06, "epoch": 1.0728476821192052, "percentage": 37.04, "elapsed_time": "0:12:11", "remaining_time": "0:20:43"}
|
4 |
+
{"current_steps": 30, "total_steps": 54, "loss": 0.9634, "lr": 5e-06, "epoch": 1.6026490066225165, "percentage": 55.56, "elapsed_time": "0:17:29", "remaining_time": "0:13:59"}
|
5 |
+
{"current_steps": 37, "total_steps": 54, "eval_loss": 0.9528446197509766, "epoch": 1.9735099337748343, "percentage": 68.52, "elapsed_time": "0:21:26", "remaining_time": "0:09:51"}
|
6 |
+
{"current_steps": 40, "total_steps": 54, "loss": 0.9627, "lr": 5e-06, "epoch": 2.1456953642384105, "percentage": 74.07, "elapsed_time": "0:24:10", "remaining_time": "0:08:27"}
|