Training in progress, epoch 1
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4976698672
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1318a1bcfdee31bc1b003ae95c6909d331852fd42216e93c5206e00197c7a864
|
3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999802720
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5ed6b3c86b88bd406398907edca4f8776e7725a0d769800dadca1e3cb1f4c96e
|
3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4915916176
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1b1706786e7076f88274f0f1d6b01c686ea11122bcede8c2dde3c2c3adda19e4
|
3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1168138808
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2acc545a2cb5fac4097c730fc60932ca14b7367f2fe0c6f7553ccbe975955098
|
3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
@@ -22,3 +22,26 @@
|
|
22 |
{"current_steps": 220, "total_steps": 675, "loss": 0.4061, "lr": 5e-06, "epoch": 0.9750692520775623, "percentage": 32.59, "elapsed_time": "1:57:26", "remaining_time": "4:02:52"}
|
23 |
{"current_steps": 225, "total_steps": 675, "eval_loss": 0.4077036678791046, "epoch": 0.997229916897507, "percentage": 33.33, "elapsed_time": "2:03:03", "remaining_time": "4:06:07"}
|
24 |
{"current_steps": 230, "total_steps": 675, "loss": 0.4093, "lr": 5e-06, "epoch": 1.0193905817174516, "percentage": 34.07, "elapsed_time": "2:06:40", "remaining_time": "4:05:04"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
22 |
{"current_steps": 220, "total_steps": 675, "loss": 0.4061, "lr": 5e-06, "epoch": 0.9750692520775623, "percentage": 32.59, "elapsed_time": "1:57:26", "remaining_time": "4:02:52"}
|
23 |
{"current_steps": 225, "total_steps": 675, "eval_loss": 0.4077036678791046, "epoch": 0.997229916897507, "percentage": 33.33, "elapsed_time": "2:03:03", "remaining_time": "4:06:07"}
|
24 |
{"current_steps": 230, "total_steps": 675, "loss": 0.4093, "lr": 5e-06, "epoch": 1.0193905817174516, "percentage": 34.07, "elapsed_time": "2:06:40", "remaining_time": "4:05:04"}
|
25 |
+
{"current_steps": 240, "total_steps": 675, "loss": 0.3815, "lr": 5e-06, "epoch": 1.0637119113573408, "percentage": 35.56, "elapsed_time": "2:12:01", "remaining_time": "3:59:17"}
|
26 |
+
{"current_steps": 250, "total_steps": 675, "loss": 0.3761, "lr": 5e-06, "epoch": 1.10803324099723, "percentage": 37.04, "elapsed_time": "2:17:22", "remaining_time": "3:53:31"}
|
27 |
+
{"current_steps": 260, "total_steps": 675, "loss": 0.3818, "lr": 5e-06, "epoch": 1.1523545706371192, "percentage": 38.52, "elapsed_time": "2:22:45", "remaining_time": "3:47:51"}
|
28 |
+
{"current_steps": 270, "total_steps": 675, "loss": 0.3792, "lr": 5e-06, "epoch": 1.1966759002770084, "percentage": 40.0, "elapsed_time": "2:28:07", "remaining_time": "3:42:11"}
|
29 |
+
{"current_steps": 280, "total_steps": 675, "loss": 0.3768, "lr": 5e-06, "epoch": 1.2409972299168974, "percentage": 41.48, "elapsed_time": "2:33:29", "remaining_time": "3:36:32"}
|
30 |
+
{"current_steps": 290, "total_steps": 675, "loss": 0.3813, "lr": 5e-06, "epoch": 1.2853185595567866, "percentage": 42.96, "elapsed_time": "2:38:51", "remaining_time": "3:30:53"}
|
31 |
+
{"current_steps": 300, "total_steps": 675, "loss": 0.3819, "lr": 5e-06, "epoch": 1.3296398891966759, "percentage": 44.44, "elapsed_time": "2:44:12", "remaining_time": "3:25:15"}
|
32 |
+
{"current_steps": 310, "total_steps": 675, "loss": 0.38, "lr": 5e-06, "epoch": 1.373961218836565, "percentage": 45.93, "elapsed_time": "2:49:34", "remaining_time": "3:19:39"}
|
33 |
+
{"current_steps": 320, "total_steps": 675, "loss": 0.3755, "lr": 5e-06, "epoch": 1.4182825484764543, "percentage": 47.41, "elapsed_time": "2:54:57", "remaining_time": "3:14:05"}
|
34 |
+
{"current_steps": 330, "total_steps": 675, "loss": 0.3808, "lr": 5e-06, "epoch": 1.4626038781163435, "percentage": 48.89, "elapsed_time": "3:00:19", "remaining_time": "3:08:31"}
|
35 |
+
{"current_steps": 340, "total_steps": 675, "loss": 0.3778, "lr": 5e-06, "epoch": 1.5069252077562327, "percentage": 50.37, "elapsed_time": "3:05:41", "remaining_time": "3:02:57"}
|
36 |
+
{"current_steps": 350, "total_steps": 675, "loss": 0.3779, "lr": 5e-06, "epoch": 1.5512465373961217, "percentage": 51.85, "elapsed_time": "3:11:03", "remaining_time": "2:57:24"}
|
37 |
+
{"current_steps": 360, "total_steps": 675, "loss": 0.374, "lr": 5e-06, "epoch": 1.595567867036011, "percentage": 53.33, "elapsed_time": "3:16:24", "remaining_time": "2:51:51"}
|
38 |
+
{"current_steps": 370, "total_steps": 675, "loss": 0.3776, "lr": 5e-06, "epoch": 1.6398891966759002, "percentage": 54.81, "elapsed_time": "3:21:46", "remaining_time": "2:46:19"}
|
39 |
+
{"current_steps": 380, "total_steps": 675, "loss": 0.3805, "lr": 5e-06, "epoch": 1.6842105263157894, "percentage": 56.3, "elapsed_time": "3:27:08", "remaining_time": "2:40:48"}
|
40 |
+
{"current_steps": 390, "total_steps": 675, "loss": 0.3776, "lr": 5e-06, "epoch": 1.7285318559556786, "percentage": 57.78, "elapsed_time": "3:32:30", "remaining_time": "2:35:17"}
|
41 |
+
{"current_steps": 400, "total_steps": 675, "loss": 0.3759, "lr": 5e-06, "epoch": 1.7728531855955678, "percentage": 59.26, "elapsed_time": "3:37:52", "remaining_time": "2:29:47"}
|
42 |
+
{"current_steps": 410, "total_steps": 675, "loss": 0.3797, "lr": 5e-06, "epoch": 1.817174515235457, "percentage": 60.74, "elapsed_time": "3:43:12", "remaining_time": "2:24:16"}
|
43 |
+
{"current_steps": 420, "total_steps": 675, "loss": 0.3736, "lr": 5e-06, "epoch": 1.8614958448753463, "percentage": 62.22, "elapsed_time": "3:48:33", "remaining_time": "2:18:46"}
|
44 |
+
{"current_steps": 430, "total_steps": 675, "loss": 0.3761, "lr": 5e-06, "epoch": 1.9058171745152355, "percentage": 63.7, "elapsed_time": "3:53:56", "remaining_time": "2:13:17"}
|
45 |
+
{"current_steps": 440, "total_steps": 675, "loss": 0.3731, "lr": 5e-06, "epoch": 1.9501385041551247, "percentage": 65.19, "elapsed_time": "3:59:17", "remaining_time": "2:07:48"}
|
46 |
+
{"current_steps": 450, "total_steps": 675, "loss": 0.3726, "lr": 5e-06, "epoch": 1.994459833795014, "percentage": 66.67, "elapsed_time": "4:04:37", "remaining_time": "2:02:18"}
|
47 |
+
{"current_steps": 451, "total_steps": 675, "eval_loss": 0.3975733816623688, "epoch": 1.9988919667590028, "percentage": 66.81, "elapsed_time": "4:07:48", "remaining_time": "2:03:04"}
|