sedrickkeh committed on
Commit
3dc38d8
·
verified ·
1 Parent(s): b872fca

Training in progress, epoch 2

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dab89e6e74f74dbad64f3b5941d5c7fcf6cc94e6b0e6e73c35cd12036bf828f2
3
  size 4976698672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:74a3b7dd8b41c1ab3433abe937c0473f28663ed514225454f795f299a4358e65
3
  size 4976698672
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5c3da36d8d36d8fcbe77064311abd22ac1f02f10d15d6a119097ed2ff868ac1b
3
  size 4999802720
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3dd69cd3d712c2074be77aa7b2e9564cefe8748c684a426e4ba415abcabf4d1a
3
  size 4999802720
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f133b2b4b694584677e1aae510329992dcdeb9eb14b4a5a6839af4515c84631c
3
  size 4915916176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a09a815060ca1e243f8b2d722c8793c75dbc687bf0f60a535d4e79cd6fad037
3
  size 4915916176
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b3e8502d0a46ce4a64f98a01149bf522b4381b127a0666179fc55026eba373ac
3
  size 1168138808
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e62e4b8b3b9059daf60f287665555a5b3dca0eb1937cbd9fec70a7cfb2b7136
3
  size 1168138808
trainer_log.jsonl CHANGED
@@ -5,3 +5,8 @@
5
  {"current_steps": 40, "total_steps": 84, "loss": 0.9925, "lr": 5e-06, "epoch": 1.4166666666666667, "percentage": 47.62, "elapsed_time": "0:22:43", "remaining_time": "0:24:59"}
6
  {"current_steps": 50, "total_steps": 84, "loss": 0.9729, "lr": 5e-06, "epoch": 1.7675438596491229, "percentage": 59.52, "elapsed_time": "0:27:58", "remaining_time": "0:19:01"}
7
  {"current_steps": 56, "total_steps": 84, "eval_loss": 0.9812449812889099, "epoch": 1.9780701754385965, "percentage": 66.67, "elapsed_time": "0:31:33", "remaining_time": "0:15:46"}
 
 
 
 
 
 
5
  {"current_steps": 40, "total_steps": 84, "loss": 0.9925, "lr": 5e-06, "epoch": 1.4166666666666667, "percentage": 47.62, "elapsed_time": "0:22:43", "remaining_time": "0:24:59"}
6
  {"current_steps": 50, "total_steps": 84, "loss": 0.9729, "lr": 5e-06, "epoch": 1.7675438596491229, "percentage": 59.52, "elapsed_time": "0:27:58", "remaining_time": "0:19:01"}
7
  {"current_steps": 56, "total_steps": 84, "eval_loss": 0.9812449812889099, "epoch": 1.9780701754385965, "percentage": 66.67, "elapsed_time": "0:31:33", "remaining_time": "0:15:46"}
8
+ {"current_steps": 60, "total_steps": 84, "loss": 1.0281, "lr": 5e-06, "epoch": 2.1315789473684212, "percentage": 71.43, "elapsed_time": "0:34:48", "remaining_time": "0:13:55"}
9
+ {"current_steps": 70, "total_steps": 84, "loss": 0.9086, "lr": 5e-06, "epoch": 2.482456140350877, "percentage": 83.33, "elapsed_time": "0:40:02", "remaining_time": "0:08:00"}
10
+ {"current_steps": 80, "total_steps": 84, "loss": 0.9026, "lr": 5e-06, "epoch": 2.8333333333333335, "percentage": 95.24, "elapsed_time": "0:45:16", "remaining_time": "0:02:15"}
11
+ {"current_steps": 84, "total_steps": 84, "eval_loss": 0.9630991816520691, "epoch": 2.973684210526316, "percentage": 100.0, "elapsed_time": "0:48:58", "remaining_time": "0:00:00"}
12
+ {"current_steps": 84, "total_steps": 84, "epoch": 2.973684210526316, "percentage": 100.0, "elapsed_time": "0:50:12", "remaining_time": "0:00:00"}