Training in progress, epoch 2

Files changed (5) hide show

model-00001-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6b23d3ca3908602b50aa3f2e6437da7f9b9c5f15fcb93761cac1773ec6485110
 size 4976698672

 version https://git-lfs.github.com/spec/v1
+oid sha256:d79f7fdb4d30aca27223445594ef9b5b7ed91d20dd10692b892f84c2fd9e6ce2
 size 4976698672

model-00002-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4f2072b661188afb39f1a9aaed6501a64b560b8a78241138711796b26c86bfa3
 size 4999802720

 version https://git-lfs.github.com/spec/v1
+oid sha256:f3ff35a79c27273836277e45fc2d8bfcc697433e7acf6bec5b015852659148db
 size 4999802720

model-00003-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b1435d48b76817b826795edf405c0fb0d41a885446c6bb8fd369e5bddf41863a
 size 4915916176

 version https://git-lfs.github.com/spec/v1
+oid sha256:c8d0711133bf8229ff230524c63ef3888ef7baf77747ef883dd24514f43369fd
 size 4915916176

model-00004-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fce827aace0cf741f8c40211b94ebe325b401c473fd5259d51d2cbcfa2995fb1
 size 1168138808

 version https://git-lfs.github.com/spec/v1
+oid sha256:488bac7d2cdcdccdf2f3be467b16592a0e7a2964211897c99322495182ea61cc
 size 1168138808

trainer_log.jsonl CHANGED Viewed

@@ -6,3 +6,8 @@
 {"current_steps": 50, "total_steps": 93, "loss": 0.9873, "lr": 5e-06, "epoch": 1.6, "percentage": 53.76, "elapsed_time": "0:28:05", "remaining_time": "0:24:09"}
 {"current_steps": 60, "total_steps": 93, "loss": 0.9711, "lr": 5e-06, "epoch": 1.92, "percentage": 64.52, "elapsed_time": "0:33:21", "remaining_time": "0:18:20"}
 {"current_steps": 62, "total_steps": 93, "eval_loss": 0.9961642026901245, "epoch": 1.984, "percentage": 66.67, "elapsed_time": "0:35:00", "remaining_time": "0:17:30"}

 {"current_steps": 50, "total_steps": 93, "loss": 0.9873, "lr": 5e-06, "epoch": 1.6, "percentage": 53.76, "elapsed_time": "0:28:05", "remaining_time": "0:24:09"}
 {"current_steps": 60, "total_steps": 93, "loss": 0.9711, "lr": 5e-06, "epoch": 1.92, "percentage": 64.52, "elapsed_time": "0:33:21", "remaining_time": "0:18:20"}
 {"current_steps": 62, "total_steps": 93, "eval_loss": 0.9961642026901245, "epoch": 1.984, "percentage": 66.67, "elapsed_time": "0:35:00", "remaining_time": "0:17:30"}
+{"current_steps": 70, "total_steps": 93, "loss": 1.008, "lr": 5e-06, "epoch": 2.24, "percentage": 75.27, "elapsed_time": "0:40:15", "remaining_time": "0:13:13"}
+{"current_steps": 80, "total_steps": 93, "loss": 0.9094, "lr": 5e-06, "epoch": 2.56, "percentage": 86.02, "elapsed_time": "0:45:31", "remaining_time": "0:07:23"}
+{"current_steps": 90, "total_steps": 93, "loss": 0.9089, "lr": 5e-06, "epoch": 2.88, "percentage": 96.77, "elapsed_time": "0:50:48", "remaining_time": "0:01:41"}
+{"current_steps": 93, "total_steps": 93, "eval_loss": 0.9772511720657349, "epoch": 2.976, "percentage": 100.0, "elapsed_time": "0:54:03", "remaining_time": "0:00:00"}
+{"current_steps": 93, "total_steps": 93, "epoch": 2.976, "percentage": 100.0, "elapsed_time": "0:55:16", "remaining_time": "0:00:00"}