EtashGuha commited on
Commit
43b65e4
·
verified ·
1 Parent(s): 1003abd

Training in progress, epoch 1

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:21994109ae0d879ee376636b53ef78d87c342a3f72dbcaa4275b9782ed4cd118
3
  size 4976698672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10f40044d7b17ce24f62f6ce38c85841b8bf8ab6a6c3194b5fb62615602e69dd
3
  size 4976698672
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7c7c1fe795ce34d36550af28018883a76e45644795c3b22b59b2d684a488fb7e
3
  size 4999802720
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88213520c000e5588cf74d852d57c164dc098609594b8a3cb88cf0ef2fcd9ad3
3
  size 4999802720
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:490729c6413b5dba0f4459292ab4d5f0221cce8d8b61fb73d4407979903d6038
3
  size 4915916176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70ee644f4419a50d381d2031d9e3df55ded715ec2fb4675c4f87db0c933c6b7b
3
  size 4915916176
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:eea64edddfebb4095db6fa6eb36f63a8461662fce4c1d2986b79c8d2767d54a2
3
  size 1168138808
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4817076e908f5e38543e99e3ca023a71c6ecd39c27df2e9f8dec38ac03d8c20c
3
  size 1168138808
trainer_log.jsonl CHANGED
@@ -2,3 +2,8 @@
2
  {"current_steps": 20, "total_steps": 108, "loss": 0.9352, "lr": 5e-06, "epoch": 0.5517241379310345, "percentage": 18.52, "elapsed_time": "0:51:59", "remaining_time": "3:48:44"}
3
  {"current_steps": 30, "total_steps": 108, "loss": 0.8976, "lr": 5e-06, "epoch": 0.8275862068965517, "percentage": 27.78, "elapsed_time": "1:17:57", "remaining_time": "3:22:40"}
4
  {"current_steps": 36, "total_steps": 108, "eval_loss": 0.8847346901893616, "epoch": 0.993103448275862, "percentage": 33.33, "elapsed_time": "1:36:09", "remaining_time": "3:12:19"}
 
 
 
 
 
 
2
  {"current_steps": 20, "total_steps": 108, "loss": 0.9352, "lr": 5e-06, "epoch": 0.5517241379310345, "percentage": 18.52, "elapsed_time": "0:51:59", "remaining_time": "3:48:44"}
3
  {"current_steps": 30, "total_steps": 108, "loss": 0.8976, "lr": 5e-06, "epoch": 0.8275862068965517, "percentage": 27.78, "elapsed_time": "1:17:57", "remaining_time": "3:22:40"}
4
  {"current_steps": 36, "total_steps": 108, "eval_loss": 0.8847346901893616, "epoch": 0.993103448275862, "percentage": 33.33, "elapsed_time": "1:36:09", "remaining_time": "3:12:19"}
5
+ {"current_steps": 40, "total_steps": 108, "loss": 0.8669, "lr": 5e-06, "epoch": 1.103448275862069, "percentage": 37.04, "elapsed_time": "1:47:22", "remaining_time": "3:02:32"}
6
+ {"current_steps": 50, "total_steps": 108, "loss": 0.832, "lr": 5e-06, "epoch": 1.3793103448275863, "percentage": 46.3, "elapsed_time": "2:13:18", "remaining_time": "2:34:38"}
7
+ {"current_steps": 60, "total_steps": 108, "loss": 0.8196, "lr": 5e-06, "epoch": 1.6551724137931034, "percentage": 55.56, "elapsed_time": "2:39:13", "remaining_time": "2:07:23"}
8
+ {"current_steps": 70, "total_steps": 108, "loss": 0.8134, "lr": 5e-06, "epoch": 1.9310344827586206, "percentage": 64.81, "elapsed_time": "3:05:08", "remaining_time": "1:40:30"}
9
+ {"current_steps": 72, "total_steps": 108, "eval_loss": 0.8555252552032471, "epoch": 1.986206896551724, "percentage": 66.67, "elapsed_time": "3:13:30", "remaining_time": "1:36:45"}