sedrickkeh committed on
Commit
6b55506
·
verified ·
1 Parent(s): 11f010e

Training in progress, epoch 2

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9f016136132f4992579f973056cd927cb3cc96b0d4350661cc7e9415c6a165ac
3
  size 4976698672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:40c3c73d6199d9c3aa0d633d65f31bc5e1be476706074d462dd73f49217449c1
3
  size 4976698672
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e1dd41f730317be2df46f6b7c3f0b1bcb742bb96ceb8b9ac39aee8f434fe7cf3
3
  size 4999802720
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:429fa6ce701bb6511d924159d25dfc439cd3b12e16ba3ee787b4d7f6d9756c04
3
  size 4999802720
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:330f1f76d6848fea3a9de0f4f29f5d82acea7f483686519799739b24d8b3d18e
3
  size 4915916176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5dfe6d9038932791cc7044026f02a34ae49c96df53ec0b89c74c31096b6ee7fb
3
  size 4915916176
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:53b8cdb5cf70332b2df084bec10525f947801b750e957a68ee1468dcd00f9177
3
  size 1168138808
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e865249a2e15deeeae1b93283833f4728b34d25350f07196bb2668b24f8e27db
3
  size 1168138808
trainer_log.jsonl CHANGED
@@ -9,3 +9,9 @@
9
  {"current_steps": 80, "total_steps": 132, "loss": 0.8393, "lr": 5e-06, "epoch": 1.7927170868347337, "percentage": 60.61, "elapsed_time": "0:44:26", "remaining_time": "0:28:53"}
10
  {"current_steps": 89, "total_steps": 132, "eval_loss": 0.8523734211921692, "epoch": 1.9943977591036415, "percentage": 67.42, "elapsed_time": "0:49:49", "remaining_time": "0:24:04"}
11
  {"current_steps": 90, "total_steps": 132, "loss": 0.8585, "lr": 5e-06, "epoch": 2.0168067226890756, "percentage": 68.18, "elapsed_time": "0:51:30", "remaining_time": "0:24:02"}
 
 
 
 
 
 
 
9
  {"current_steps": 80, "total_steps": 132, "loss": 0.8393, "lr": 5e-06, "epoch": 1.7927170868347337, "percentage": 60.61, "elapsed_time": "0:44:26", "remaining_time": "0:28:53"}
10
  {"current_steps": 89, "total_steps": 132, "eval_loss": 0.8523734211921692, "epoch": 1.9943977591036415, "percentage": 67.42, "elapsed_time": "0:49:49", "remaining_time": "0:24:04"}
11
  {"current_steps": 90, "total_steps": 132, "loss": 0.8585, "lr": 5e-06, "epoch": 2.0168067226890756, "percentage": 68.18, "elapsed_time": "0:51:30", "remaining_time": "0:24:02"}
12
+ {"current_steps": 100, "total_steps": 132, "loss": 0.7773, "lr": 5e-06, "epoch": 2.2408963585434174, "percentage": 75.76, "elapsed_time": "0:56:51", "remaining_time": "0:18:11"}
13
+ {"current_steps": 110, "total_steps": 132, "loss": 0.7786, "lr": 5e-06, "epoch": 2.4649859943977592, "percentage": 83.33, "elapsed_time": "1:02:13", "remaining_time": "0:12:26"}
14
+ {"current_steps": 120, "total_steps": 132, "loss": 0.7664, "lr": 5e-06, "epoch": 2.689075630252101, "percentage": 90.91, "elapsed_time": "1:07:33", "remaining_time": "0:06:45"}
15
+ {"current_steps": 130, "total_steps": 132, "loss": 0.7699, "lr": 5e-06, "epoch": 2.9131652661064424, "percentage": 98.48, "elapsed_time": "1:12:54", "remaining_time": "0:01:07"}
16
+ {"current_steps": 132, "total_steps": 132, "eval_loss": 0.8426499366760254, "epoch": 2.957983193277311, "percentage": 100.0, "elapsed_time": "1:15:47", "remaining_time": "0:00:00"}
17
+ {"current_steps": 132, "total_steps": 132, "epoch": 2.957983193277311, "percentage": 100.0, "elapsed_time": "1:17:01", "remaining_time": "0:00:00"}