gsmyrnis commited on
Commit
30ebb24
·
verified ·
1 Parent(s): 4b28e9a

Training in progress, epoch 3

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d5a18b4cd23249d5f1371851cf6641cc0ea68befa57401db700c6a1a7abaca1a
3
  size 4976698672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b0b5175b6a6b9ad16bfd112c64593e5045467539873c235b6b63dffa4825faf
3
  size 4976698672
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:16d81277902f6f54fba1db78a5a241facf3fd458ec7996e42b8aec781031c9dd
3
  size 4999802720
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b7b4440dd2c3e05b2345f5a053f9c0f4c1374a371368d01a989144772de7d031
3
  size 4999802720
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c7e489a73ad30e2db985afbfbfb37285d92dac6061749f8c8fd4576d5eb85ac5
3
  size 4915916176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a4a7cfe98706a690663577ae16aa276360950389536835f504d6492f6a8c4df
3
  size 4915916176
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f503bc03deb1c6776f8a28b3cf6f77f855b0760fc61b4ac468b9c05699225f3c
3
  size 1168138808
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab2f6de02a913adafd867ce7e80dd0df8e63afe4eaf60870c81ee98bab0e36e7
3
  size 1168138808
trainer_log.jsonl CHANGED
@@ -121,3 +121,12 @@
121
  {"current_steps": 1190, "total_steps": 1281, "loss": 0.4704, "lr": 5e-06, "epoch": 2.7868852459016393, "percentage": 92.9, "elapsed_time": "2:02:11", "remaining_time": "0:09:20"}
122
  {"current_steps": 1200, "total_steps": 1281, "loss": 0.4707, "lr": 5e-06, "epoch": 2.810304449648712, "percentage": 93.68, "elapsed_time": "2:03:11", "remaining_time": "0:08:18"}
123
  {"current_steps": 1210, "total_steps": 1281, "loss": 0.4679, "lr": 5e-06, "epoch": 2.8337236533957846, "percentage": 94.46, "elapsed_time": "2:04:10", "remaining_time": "0:07:17"}
 
 
 
 
 
 
 
 
 
 
121
  {"current_steps": 1190, "total_steps": 1281, "loss": 0.4704, "lr": 5e-06, "epoch": 2.7868852459016393, "percentage": 92.9, "elapsed_time": "2:02:11", "remaining_time": "0:09:20"}
122
  {"current_steps": 1200, "total_steps": 1281, "loss": 0.4707, "lr": 5e-06, "epoch": 2.810304449648712, "percentage": 93.68, "elapsed_time": "2:03:11", "remaining_time": "0:08:18"}
123
  {"current_steps": 1210, "total_steps": 1281, "loss": 0.4679, "lr": 5e-06, "epoch": 2.8337236533957846, "percentage": 94.46, "elapsed_time": "2:04:10", "remaining_time": "0:07:17"}
124
+ {"current_steps": 1220, "total_steps": 1281, "loss": 0.4711, "lr": 5e-06, "epoch": 2.857142857142857, "percentage": 95.24, "elapsed_time": "2:05:09", "remaining_time": "0:06:15"}
125
+ {"current_steps": 1230, "total_steps": 1281, "loss": 0.4653, "lr": 5e-06, "epoch": 2.88056206088993, "percentage": 96.02, "elapsed_time": "2:06:08", "remaining_time": "0:05:13"}
126
+ {"current_steps": 1240, "total_steps": 1281, "loss": 0.4667, "lr": 5e-06, "epoch": 2.9039812646370025, "percentage": 96.8, "elapsed_time": "2:07:08", "remaining_time": "0:04:12"}
127
+ {"current_steps": 1250, "total_steps": 1281, "loss": 0.4664, "lr": 5e-06, "epoch": 2.927400468384075, "percentage": 97.58, "elapsed_time": "2:08:08", "remaining_time": "0:03:10"}
128
+ {"current_steps": 1260, "total_steps": 1281, "loss": 0.468, "lr": 5e-06, "epoch": 2.9508196721311473, "percentage": 98.36, "elapsed_time": "2:09:09", "remaining_time": "0:02:09"}
129
+ {"current_steps": 1270, "total_steps": 1281, "loss": 0.4654, "lr": 5e-06, "epoch": 2.9742388758782203, "percentage": 99.14, "elapsed_time": "2:10:09", "remaining_time": "0:01:07"}
130
+ {"current_steps": 1280, "total_steps": 1281, "loss": 0.47, "lr": 5e-06, "epoch": 2.9976580796252925, "percentage": 99.92, "elapsed_time": "2:11:08", "remaining_time": "0:00:06"}
131
+ {"current_steps": 1281, "total_steps": 1281, "eval_loss": 0.5069288611412048, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "2:13:48", "remaining_time": "0:00:00"}
132
+ {"current_steps": 1281, "total_steps": 1281, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "2:15:16", "remaining_time": "0:00:00"}