sedrickkeh commited on
Commit
0423a8f
·
verified ·
1 Parent(s): e74aee1

Training in progress, epoch 3

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:496c663a15e1716834b2ba165fd080cd239c1fb6c5a4508eb6f524bf0e5cc956
3
  size 4976698672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2279fe66849158fb64c40d3eb08e49a75b50c07246a5a462fef74c738752aa50
3
  size 4976698672
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:946dce15cd5ea13e6e2b18cd0933e55d229170e08d8b13e070fea11e31c5baab
3
  size 4999802720
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e99976b48e522006f40fd4d146546d4a6ecf5e24da95e5b44f9fa833c01211f0
3
  size 4999802720
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:22be6a9b03881f64bfa92906b0b4190ecd1827bf11c9312f600df33ae86b8707
3
  size 4915916176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a803a85980fc6c9c5aed172005bfa752f771c5e179ca4612b4068c32ef67dd4a
3
  size 4915916176
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:54582bdca0d596cb49b9e26fb11168942353c18b1aa71710f7af40c878ba04a9
3
  size 1168138808
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:113bb9aa3a2605e915daa8a2fa9a1a237077a4f1167e19d49d6ea205bc049a7e
3
  size 1168138808
trainer_log.jsonl CHANGED
@@ -8,3 +8,8 @@
8
  {"current_steps": 70, "total_steps": 117, "loss": 0.4657, "lr": 5e-06, "epoch": 1.7948717948717947, "percentage": 59.83, "elapsed_time": "1:08:59", "remaining_time": "0:46:19"}
9
  {"current_steps": 78, "total_steps": 117, "eval_loss": 0.48121070861816406, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "1:17:21", "remaining_time": "0:38:40"}
10
  {"current_steps": 80, "total_steps": 117, "loss": 0.4509, "lr": 5e-06, "epoch": 2.051282051282051, "percentage": 68.38, "elapsed_time": "1:20:27", "remaining_time": "0:37:12"}
 
 
 
 
 
 
8
  {"current_steps": 70, "total_steps": 117, "loss": 0.4657, "lr": 5e-06, "epoch": 1.7948717948717947, "percentage": 59.83, "elapsed_time": "1:08:59", "remaining_time": "0:46:19"}
9
  {"current_steps": 78, "total_steps": 117, "eval_loss": 0.48121070861816406, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "1:17:21", "remaining_time": "0:38:40"}
10
  {"current_steps": 80, "total_steps": 117, "loss": 0.4509, "lr": 5e-06, "epoch": 2.051282051282051, "percentage": 68.38, "elapsed_time": "1:20:27", "remaining_time": "0:37:12"}
11
+ {"current_steps": 90, "total_steps": 117, "loss": 0.4352, "lr": 5e-06, "epoch": 2.3076923076923075, "percentage": 76.92, "elapsed_time": "1:30:03", "remaining_time": "0:27:01"}
12
+ {"current_steps": 100, "total_steps": 117, "loss": 0.4268, "lr": 5e-06, "epoch": 2.564102564102564, "percentage": 85.47, "elapsed_time": "1:39:40", "remaining_time": "0:16:56"}
13
+ {"current_steps": 110, "total_steps": 117, "loss": 0.4298, "lr": 5e-06, "epoch": 2.8205128205128203, "percentage": 94.02, "elapsed_time": "1:49:16", "remaining_time": "0:06:57"}
14
+ {"current_steps": 117, "total_steps": 117, "eval_loss": 0.4801027178764343, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "1:57:53", "remaining_time": "0:00:00"}
15
+ {"current_steps": 117, "total_steps": 117, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "1:59:07", "remaining_time": "0:00:00"}