sedrickkeh committed on
Commit
5c85fb5
·
verified ·
1 Parent(s): e92adcd

Training in progress, epoch 2

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ebbe14efe580784ef2d4a8d10c70ae1941a7481e531e14d86299a7db46b5ce3a
3
  size 4976698672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:002d107608c7826a92d5ae8fce67a4f6e5aa8a0f467166212b8ba266aac65849
3
  size 4976698672
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bde40f127fb70ad4b2cce347d8e8efda6b8c51d0d5d925cba6b936f6910e8a58
3
  size 4999802720
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a2e9bf29c7ae4e21d29a444d37b6d25cba22b6956008a2d8f62b205eca22b26
3
  size 4999802720
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fd281ac452aa1b0c543d92e0b78e8cff8976da44b829aabaf0727adabc941d15
3
  size 4915916176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:71bdd312318a4e8be7a1364cc8f1a3ca4737c15ac2006ddac7e0ec9431a7cd0a
3
  size 4915916176
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e01304b587dd6f964fca04068c3ec50100379a2645a618a43038cf6c309f9b31
3
  size 1168138808
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:453419b7857ca38e1a81dec44c26dd0a4122bace0875f6271e643bd72668b555
3
  size 1168138808
trainer_log.jsonl CHANGED
@@ -11,3 +11,10 @@
11
  {"current_steps": 100, "total_steps": 165, "loss": 0.5526, "lr": 5e-06, "epoch": 1.8058690744920993, "percentage": 60.61, "elapsed_time": "0:55:15", "remaining_time": "0:35:54"}
12
  {"current_steps": 110, "total_steps": 165, "loss": 0.5525, "lr": 5e-06, "epoch": 1.9864559819413092, "percentage": 66.67, "elapsed_time": "1:00:34", "remaining_time": "0:30:17"}
13
  {"current_steps": 110, "total_steps": 165, "eval_loss": 0.5813493132591248, "epoch": 1.9864559819413092, "percentage": 66.67, "elapsed_time": "1:01:33", "remaining_time": "0:30:46"}
 
 
 
 
 
 
 
 
11
  {"current_steps": 100, "total_steps": 165, "loss": 0.5526, "lr": 5e-06, "epoch": 1.8058690744920993, "percentage": 60.61, "elapsed_time": "0:55:15", "remaining_time": "0:35:54"}
12
  {"current_steps": 110, "total_steps": 165, "loss": 0.5525, "lr": 5e-06, "epoch": 1.9864559819413092, "percentage": 66.67, "elapsed_time": "1:00:34", "remaining_time": "0:30:17"}
13
  {"current_steps": 110, "total_steps": 165, "eval_loss": 0.5813493132591248, "epoch": 1.9864559819413092, "percentage": 66.67, "elapsed_time": "1:01:33", "remaining_time": "0:30:46"}
14
+ {"current_steps": 120, "total_steps": 165, "loss": 0.549, "lr": 5e-06, "epoch": 2.1670428893905194, "percentage": 72.73, "elapsed_time": "1:07:49", "remaining_time": "0:25:26"}
15
+ {"current_steps": 130, "total_steps": 165, "loss": 0.5085, "lr": 5e-06, "epoch": 2.3476297968397293, "percentage": 78.79, "elapsed_time": "1:13:11", "remaining_time": "0:19:42"}
16
+ {"current_steps": 140, "total_steps": 165, "loss": 0.5079, "lr": 5e-06, "epoch": 2.528216704288939, "percentage": 84.85, "elapsed_time": "1:18:32", "remaining_time": "0:14:01"}
17
+ {"current_steps": 150, "total_steps": 165, "loss": 0.5073, "lr": 5e-06, "epoch": 2.708803611738149, "percentage": 90.91, "elapsed_time": "1:23:54", "remaining_time": "0:08:23"}
18
+ {"current_steps": 160, "total_steps": 165, "loss": 0.5138, "lr": 5e-06, "epoch": 2.889390519187359, "percentage": 96.97, "elapsed_time": "1:29:15", "remaining_time": "0:02:47"}
19
+ {"current_steps": 165, "total_steps": 165, "eval_loss": 0.5825901627540588, "epoch": 2.979683972911964, "percentage": 100.0, "elapsed_time": "1:33:52", "remaining_time": "0:00:00"}
20
+ {"current_steps": 165, "total_steps": 165, "epoch": 2.979683972911964, "percentage": 100.0, "elapsed_time": "1:35:05", "remaining_time": "0:00:00"}