Training in progress, epoch 2

Files changed (5) hide show

model-00001-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:84cc546ea88454b30ea0b32cd0f00f215939150cc60dfb2d75cf3febf9e88366
 size 4976698672

 version https://git-lfs.github.com/spec/v1
+oid sha256:9e153f7ad2a2541e1730bc6516e95f20afa25ba0977fd3db749028c003290822
 size 4976698672

model-00002-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e8ab5d0e4a635af5a4c445297a1b8d3f18d50e635fbee057ae5847e707f28ac4
 size 4999802720

 version https://git-lfs.github.com/spec/v1
+oid sha256:ba4582466093af613091ea02ab8aca86c115fdc6ace3856f73c81b5934113cbd
 size 4999802720

model-00003-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c1009fab4e5c6f7bea720958b4ad4874b8e34cd8859ba166f9bc30cdb6249fcc
 size 4915916176

 version https://git-lfs.github.com/spec/v1
+oid sha256:f3346a7cdb9f200a8a594f1affd3865239624b653b0a4a3c92d45ceb2603e749
 size 4915916176

model-00004-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b4cd0aaf8d5c7ecf6c1ff628cd6c6e9ec4a149a10bbb141822056f17c629e0a4
 size 1168138808

 version https://git-lfs.github.com/spec/v1
+oid sha256:2ac4cf753de190970fa6e1062de29b4e0f794d29442fe5c2be97fc3ee6ff0391
 size 1168138808

trainer_log.jsonl CHANGED Viewed

@@ -6,3 +6,8 @@
 {"current_steps": 50, "total_steps": 93, "loss": 0.4113, "lr": 5e-06, "epoch": 1.594488188976378, "percentage": 53.76, "elapsed_time": "0:49:49", "remaining_time": "0:42:51"}
 {"current_steps": 60, "total_steps": 93, "loss": 0.4167, "lr": 5e-06, "epoch": 1.909448818897638, "percentage": 64.52, "elapsed_time": "0:59:28", "remaining_time": "0:32:42"}
 {"current_steps": 62, "total_steps": 93, "eval_loss": 0.4076673686504364, "epoch": 1.9724409448818898, "percentage": 66.67, "elapsed_time": "1:02:13", "remaining_time": "0:31:06"}

 {"current_steps": 50, "total_steps": 93, "loss": 0.4113, "lr": 5e-06, "epoch": 1.594488188976378, "percentage": 53.76, "elapsed_time": "0:49:49", "remaining_time": "0:42:51"}
 {"current_steps": 60, "total_steps": 93, "loss": 0.4167, "lr": 5e-06, "epoch": 1.909448818897638, "percentage": 64.52, "elapsed_time": "0:59:28", "remaining_time": "0:32:42"}
 {"current_steps": 62, "total_steps": 93, "eval_loss": 0.4076673686504364, "epoch": 1.9724409448818898, "percentage": 66.67, "elapsed_time": "1:02:13", "remaining_time": "0:31:06"}
+{"current_steps": 70, "total_steps": 93, "loss": 0.4311, "lr": 5e-06, "epoch": 2.2440944881889764, "percentage": 75.27, "elapsed_time": "1:10:54", "remaining_time": "0:23:17"}
+{"current_steps": 80, "total_steps": 93, "loss": 0.3895, "lr": 5e-06, "epoch": 2.559055118110236, "percentage": 86.02, "elapsed_time": "1:20:31", "remaining_time": "0:13:05"}
+{"current_steps": 90, "total_steps": 93, "loss": 0.3872, "lr": 5e-06, "epoch": 2.8740157480314963, "percentage": 96.77, "elapsed_time": "1:30:08", "remaining_time": "0:03:00"}
+{"current_steps": 93, "total_steps": 93, "eval_loss": 0.400202214717865, "epoch": 2.968503937007874, "percentage": 100.0, "elapsed_time": "1:34:49", "remaining_time": "0:00:00"}
+{"current_steps": 93, "total_steps": 93, "epoch": 2.968503937007874, "percentage": 100.0, "elapsed_time": "1:36:03", "remaining_time": "0:00:00"}