Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4976698672
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2f32be30d71ab482614b34cb7b9be6145b6db2ba168e6ccc0c787665f22a280d
|
3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999802720
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d54e0668796c376e3dde689708f25080420f11b6247b8030f5f573a477c961da
|
3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4915916176
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ecf2a138718acfc5cfb09c89cc5ac7ea6389b6f8b9e0bcbd686706f562551275
|
3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1168138808
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dfd321f0abc60182ac54d4b174858fc24f49223ce88aba6ff17c7b3f4a2288af
|
3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
@@ -33,3 +33,20 @@
|
|
33 |
{"current_steps": 320, "total_steps": 501, "loss": 0.7196, "lr": 5e-06, "epoch": 1.9076005961251863, "percentage": 63.87, "elapsed_time": "5:12:41", "remaining_time": "2:56:51"}
|
34 |
{"current_steps": 330, "total_steps": 501, "loss": 0.7274, "lr": 5e-06, "epoch": 1.9672131147540983, "percentage": 65.87, "elapsed_time": "5:22:20", "remaining_time": "2:47:01"}
|
35 |
{"current_steps": 335, "total_steps": 501, "eval_loss": 0.7537275552749634, "epoch": 1.9970193740685542, "percentage": 66.87, "elapsed_time": "5:30:31", "remaining_time": "2:43:46"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
33 |
{"current_steps": 320, "total_steps": 501, "loss": 0.7196, "lr": 5e-06, "epoch": 1.9076005961251863, "percentage": 63.87, "elapsed_time": "5:12:41", "remaining_time": "2:56:51"}
|
34 |
{"current_steps": 330, "total_steps": 501, "loss": 0.7274, "lr": 5e-06, "epoch": 1.9672131147540983, "percentage": 65.87, "elapsed_time": "5:22:20", "remaining_time": "2:47:01"}
|
35 |
{"current_steps": 335, "total_steps": 501, "eval_loss": 0.7537275552749634, "epoch": 1.9970193740685542, "percentage": 66.87, "elapsed_time": "5:30:31", "remaining_time": "2:43:46"}
|
36 |
+
{"current_steps": 340, "total_steps": 501, "loss": 0.7213, "lr": 5e-06, "epoch": 2.0268256333830106, "percentage": 67.86, "elapsed_time": "5:36:05", "remaining_time": "2:39:08"}
|
37 |
+
{"current_steps": 350, "total_steps": 501, "loss": 0.6748, "lr": 5e-06, "epoch": 2.0864381520119224, "percentage": 69.86, "elapsed_time": "5:45:42", "remaining_time": "2:29:08"}
|
38 |
+
{"current_steps": 360, "total_steps": 501, "loss": 0.6786, "lr": 5e-06, "epoch": 2.1460506706408347, "percentage": 71.86, "elapsed_time": "5:55:20", "remaining_time": "2:19:10"}
|
39 |
+
{"current_steps": 370, "total_steps": 501, "loss": 0.6768, "lr": 5e-06, "epoch": 2.2056631892697465, "percentage": 73.85, "elapsed_time": "6:05:00", "remaining_time": "2:09:13"}
|
40 |
+
{"current_steps": 380, "total_steps": 501, "loss": 0.6779, "lr": 5e-06, "epoch": 2.2652757078986587, "percentage": 75.85, "elapsed_time": "6:14:38", "remaining_time": "1:59:17"}
|
41 |
+
{"current_steps": 390, "total_steps": 501, "loss": 0.6764, "lr": 5e-06, "epoch": 2.3248882265275705, "percentage": 77.84, "elapsed_time": "6:24:16", "remaining_time": "1:49:22"}
|
42 |
+
{"current_steps": 400, "total_steps": 501, "loss": 0.6782, "lr": 5e-06, "epoch": 2.384500745156483, "percentage": 79.84, "elapsed_time": "6:33:56", "remaining_time": "1:39:28"}
|
43 |
+
{"current_steps": 410, "total_steps": 501, "loss": 0.6723, "lr": 5e-06, "epoch": 2.444113263785395, "percentage": 81.84, "elapsed_time": "6:43:35", "remaining_time": "1:29:34"}
|
44 |
+
{"current_steps": 420, "total_steps": 501, "loss": 0.6771, "lr": 5e-06, "epoch": 2.503725782414307, "percentage": 83.83, "elapsed_time": "6:53:13", "remaining_time": "1:19:41"}
|
45 |
+
{"current_steps": 430, "total_steps": 501, "loss": 0.6772, "lr": 5e-06, "epoch": 2.563338301043219, "percentage": 85.83, "elapsed_time": "7:02:51", "remaining_time": "1:09:49"}
|
46 |
+
{"current_steps": 440, "total_steps": 501, "loss": 0.6771, "lr": 5e-06, "epoch": 2.6229508196721314, "percentage": 87.82, "elapsed_time": "7:12:30", "remaining_time": "0:59:57"}
|
47 |
+
{"current_steps": 450, "total_steps": 501, "loss": 0.6777, "lr": 5e-06, "epoch": 2.682563338301043, "percentage": 89.82, "elapsed_time": "7:22:08", "remaining_time": "0:50:06"}
|
48 |
+
{"current_steps": 460, "total_steps": 501, "loss": 0.6745, "lr": 5e-06, "epoch": 2.742175856929955, "percentage": 91.82, "elapsed_time": "7:31:48", "remaining_time": "0:40:16"}
|
49 |
+
{"current_steps": 470, "total_steps": 501, "loss": 0.6781, "lr": 5e-06, "epoch": 2.8017883755588673, "percentage": 93.81, "elapsed_time": "7:41:27", "remaining_time": "0:30:26"}
|
50 |
+
{"current_steps": 480, "total_steps": 501, "loss": 0.6794, "lr": 5e-06, "epoch": 2.8614008941877795, "percentage": 95.81, "elapsed_time": "7:51:06", "remaining_time": "0:20:36"}
|
51 |
+
{"current_steps": 490, "total_steps": 501, "loss": 0.6742, "lr": 5e-06, "epoch": 2.9210134128166914, "percentage": 97.8, "elapsed_time": "8:00:45", "remaining_time": "0:10:47"}
|
52 |
+
{"current_steps": 500, "total_steps": 501, "loss": 0.6854, "lr": 5e-06, "epoch": 2.9806259314456036, "percentage": 99.8, "elapsed_time": "8:10:22", "remaining_time": "0:00:58"}
|