sedrickkeh commited on
Commit
3226b49
·
verified ·
1 Parent(s): 4b064e8

Training in progress, epoch 1

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e6dff757afc02e4fbf7be2a0780ba0a0bb5eb1e76bbf546418bf19528f1f5bb5
3
  size 4976698672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84cc546ea88454b30ea0b32cd0f00f215939150cc60dfb2d75cf3febf9e88366
3
  size 4976698672
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f3ee1719ac1367cfd9c6dae658ce9fd612b6206a04c9eee6d8214fd289bebf82
3
  size 4999802720
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e8ab5d0e4a635af5a4c445297a1b8d3f18d50e635fbee057ae5847e707f28ac4
3
  size 4999802720
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9e6045d2c756cbc596e678362bb9345767687b3e28968216154e9f5054ccc4a1
3
  size 4915916176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1009fab4e5c6f7bea720958b4ad4874b8e34cd8859ba166f9bc30cdb6249fcc
3
  size 4915916176
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5f536f38b522cab40b2d04c172745cd434990ab6150a6d37ea08345c3bd44487
3
  size 1168138808
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b4cd0aaf8d5c7ecf6c1ff628cd6c6e9ec4a149a10bbb141822056f17c629e0a4
3
  size 1168138808
trainer_log.jsonl CHANGED
@@ -2,3 +2,7 @@
2
  {"current_steps": 20, "total_steps": 93, "loss": 0.4778, "lr": 5e-06, "epoch": 0.6299212598425197, "percentage": 21.51, "elapsed_time": "0:19:16", "remaining_time": "1:10:20"}
3
  {"current_steps": 30, "total_steps": 93, "loss": 0.4472, "lr": 5e-06, "epoch": 0.9448818897637795, "percentage": 32.26, "elapsed_time": "0:28:53", "remaining_time": "1:00:39"}
4
  {"current_steps": 31, "total_steps": 93, "eval_loss": 0.43012088537216187, "epoch": 0.9763779527559056, "percentage": 33.33, "elapsed_time": "0:30:33", "remaining_time": "1:01:06"}
 
 
 
 
 
2
  {"current_steps": 20, "total_steps": 93, "loss": 0.4778, "lr": 5e-06, "epoch": 0.6299212598425197, "percentage": 21.51, "elapsed_time": "0:19:16", "remaining_time": "1:10:20"}
3
  {"current_steps": 30, "total_steps": 93, "loss": 0.4472, "lr": 5e-06, "epoch": 0.9448818897637795, "percentage": 32.26, "elapsed_time": "0:28:53", "remaining_time": "1:00:39"}
4
  {"current_steps": 31, "total_steps": 93, "eval_loss": 0.43012088537216187, "epoch": 0.9763779527559056, "percentage": 33.33, "elapsed_time": "0:30:33", "remaining_time": "1:01:06"}
5
+ {"current_steps": 40, "total_steps": 93, "loss": 0.4667, "lr": 5e-06, "epoch": 1.279527559055118, "percentage": 43.01, "elapsed_time": "0:40:12", "remaining_time": "0:53:17"}
6
+ {"current_steps": 50, "total_steps": 93, "loss": 0.4113, "lr": 5e-06, "epoch": 1.594488188976378, "percentage": 53.76, "elapsed_time": "0:49:49", "remaining_time": "0:42:51"}
7
+ {"current_steps": 60, "total_steps": 93, "loss": 0.4167, "lr": 5e-06, "epoch": 1.909448818897638, "percentage": 64.52, "elapsed_time": "0:59:28", "remaining_time": "0:32:42"}
8
+ {"current_steps": 62, "total_steps": 93, "eval_loss": 0.4076673686504364, "epoch": 1.9724409448818898, "percentage": 66.67, "elapsed_time": "1:02:13", "remaining_time": "0:31:06"}