sedrickkeh committed on
Commit
23fde87
·
verified ·
1 Parent(s): 4e0d318

Training in progress, epoch 2

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bbd6f5d4fd89a11bf5edbd7ae4ea2220f0e73b67fad5f07166b23a3ef1132b4b
3
  size 4976698672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0f3dad0a26aea98709f4868c9d9f791d25b61b94cee3bed41983db7822afb93a
3
  size 4976698672
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:68c191814a2ff0fc415b98df100ed95cb1cb37eacedf0616d6867747a138c22f
3
  size 4999802720
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7d2760249711ebf5e9dcd4e9df10a3776769493c14ea2b70a9123ae1b8cba2a7
3
  size 4999802720
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c9134586b467e212c5e74fc89286eeceac053527afeca6ef665525a6e185893a
3
  size 4915916176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:919997a6ee7e79f6f144f19cbe4577a08c0106c47646515d648224354eb1a15c
3
  size 4915916176
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:92a7f86b8357cd5059b9e93cd562b395cea20faf9dbf385365d9bb24255cbe79
3
  size 1168138808
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8beb3db21848b4254d2e32b46ee1cf963972d726cc1dc66fe9337d141eec07e0
3
  size 1168138808
trainer_log.jsonl CHANGED
@@ -10,3 +10,10 @@
10
  {"current_steps": 90, "total_steps": 150, "loss": 0.5397, "lr": 5e-06, "epoch": 1.7955112219451372, "percentage": 60.0, "elapsed_time": "1:26:57", "remaining_time": "0:57:58"}
11
  {"current_steps": 100, "total_steps": 150, "loss": 0.5438, "lr": 5e-06, "epoch": 1.9950124688279303, "percentage": 66.67, "elapsed_time": "1:36:23", "remaining_time": "0:48:11"}
12
  {"current_steps": 100, "total_steps": 150, "eval_loss": 0.5740869641304016, "epoch": 1.9950124688279303, "percentage": 66.67, "elapsed_time": "1:37:29", "remaining_time": "0:48:44"}
 
 
 
 
 
 
 
 
10
  {"current_steps": 90, "total_steps": 150, "loss": 0.5397, "lr": 5e-06, "epoch": 1.7955112219451372, "percentage": 60.0, "elapsed_time": "1:26:57", "remaining_time": "0:57:58"}
11
  {"current_steps": 100, "total_steps": 150, "loss": 0.5438, "lr": 5e-06, "epoch": 1.9950124688279303, "percentage": 66.67, "elapsed_time": "1:36:23", "remaining_time": "0:48:11"}
12
  {"current_steps": 100, "total_steps": 150, "eval_loss": 0.5740869641304016, "epoch": 1.9950124688279303, "percentage": 66.67, "elapsed_time": "1:37:29", "remaining_time": "0:48:44"}
13
+ {"current_steps": 110, "total_steps": 150, "loss": 0.5407, "lr": 5e-06, "epoch": 2.1945137157107233, "percentage": 73.33, "elapsed_time": "1:47:51", "remaining_time": "0:39:13"}
14
+ {"current_steps": 120, "total_steps": 150, "loss": 0.4996, "lr": 5e-06, "epoch": 2.3940149625935163, "percentage": 80.0, "elapsed_time": "1:57:16", "remaining_time": "0:29:19"}
15
+ {"current_steps": 130, "total_steps": 150, "loss": 0.4972, "lr": 5e-06, "epoch": 2.5935162094763093, "percentage": 86.67, "elapsed_time": "2:06:44", "remaining_time": "0:19:29"}
16
+ {"current_steps": 140, "total_steps": 150, "loss": 0.4926, "lr": 5e-06, "epoch": 2.7930174563591024, "percentage": 93.33, "elapsed_time": "2:16:11", "remaining_time": "0:09:43"}
17
+ {"current_steps": 150, "total_steps": 150, "loss": 0.4952, "lr": 5e-06, "epoch": 2.9925187032418954, "percentage": 100.0, "elapsed_time": "2:25:37", "remaining_time": "0:00:00"}
18
+ {"current_steps": 150, "total_steps": 150, "eval_loss": 0.5672302842140198, "epoch": 2.9925187032418954, "percentage": 100.0, "elapsed_time": "2:27:42", "remaining_time": "0:00:00"}
19
+ {"current_steps": 150, "total_steps": 150, "epoch": 2.9925187032418954, "percentage": 100.0, "elapsed_time": "2:28:56", "remaining_time": "0:00:00"}