Training in progress, epoch 2
Browse files
model-00001-of-00003.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4949453792
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:52fc98c43906faab05c1813e058c87fd219fea801456c4e76953508aacba20bb
|
3 |
size 4949453792
|
model-00002-of-00003.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999819336
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c68a024292cde277d36cc83965b268b68fa1244aae0d59b667d9afa9aa2bd3ea
|
3 |
size 4999819336
|
model-00003-of-00003.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4546807800
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:035a6b88018731b0495043d2dcbbf3cb07256ba56b758c65ac172bb95207e490
|
3 |
size 4546807800
|
trainer_log.jsonl
CHANGED
@@ -49,3 +49,51 @@
|
|
49 |
{"current_steps": 480, "total_steps": 1419, "loss": 0.2656, "lr": 4.052926668808791e-06, "epoch": 1.014799154334038, "percentage": 33.83, "elapsed_time": "0:47:56", "remaining_time": "1:33:46"}
|
50 |
{"current_steps": 490, "total_steps": 1419, "loss": 0.2439, "lr": 4.009825847318922e-06, "epoch": 1.0359408033826638, "percentage": 34.53, "elapsed_time": "0:48:56", "remaining_time": "1:32:46"}
|
51 |
{"current_steps": 500, "total_steps": 1419, "loss": 0.2422, "lr": 3.966040782112451e-06, "epoch": 1.0570824524312896, "percentage": 35.24, "elapsed_time": "0:49:55", "remaining_time": "1:31:45"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
49 |
{"current_steps": 480, "total_steps": 1419, "loss": 0.2656, "lr": 4.052926668808791e-06, "epoch": 1.014799154334038, "percentage": 33.83, "elapsed_time": "0:47:56", "remaining_time": "1:33:46"}
|
50 |
{"current_steps": 490, "total_steps": 1419, "loss": 0.2439, "lr": 4.009825847318922e-06, "epoch": 1.0359408033826638, "percentage": 34.53, "elapsed_time": "0:48:56", "remaining_time": "1:32:46"}
|
51 |
{"current_steps": 500, "total_steps": 1419, "loss": 0.2422, "lr": 3.966040782112451e-06, "epoch": 1.0570824524312896, "percentage": 35.24, "elapsed_time": "0:49:55", "remaining_time": "1:31:45"}
|
52 |
+
{"current_steps": 510, "total_steps": 1419, "loss": 0.2425, "lr": 3.921595253980836e-06, "epoch": 1.0782241014799154, "percentage": 35.94, "elapsed_time": "0:50:54", "remaining_time": "1:30:44"}
|
53 |
+
{"current_steps": 520, "total_steps": 1419, "loss": 0.2431, "lr": 3.876513402429883e-06, "epoch": 1.0993657505285412, "percentage": 36.65, "elapsed_time": "0:51:54", "remaining_time": "1:29:43"}
|
54 |
+
{"current_steps": 530, "total_steps": 1419, "loss": 0.2413, "lr": 3.83081971256896e-06, "epoch": 1.120507399577167, "percentage": 37.35, "elapsed_time": "0:52:53", "remaining_time": "1:28:42"}
|
55 |
+
{"current_steps": 540, "total_steps": 1419, "loss": 0.2454, "lr": 3.7845390018125065e-06, "epoch": 1.1416490486257929, "percentage": 38.05, "elapsed_time": "0:53:52", "remaining_time": "1:27:41"}
|
56 |
+
{"current_steps": 550, "total_steps": 1419, "loss": 0.2394, "lr": 3.737696406401062e-06, "epoch": 1.1627906976744187, "percentage": 38.76, "elapsed_time": "0:54:52", "remaining_time": "1:26:41"}
|
57 |
+
{"current_steps": 560, "total_steps": 1419, "loss": 0.2448, "lr": 3.6903173677491266e-06, "epoch": 1.1839323467230445, "percentage": 39.46, "elapsed_time": "0:55:51", "remaining_time": "1:25:41"}
|
58 |
+
{"current_steps": 570, "total_steps": 1419, "loss": 0.2437, "lr": 3.642427618627277e-06, "epoch": 1.20507399577167, "percentage": 40.17, "elapsed_time": "0:56:50", "remaining_time": "1:24:40"}
|
59 |
+
{"current_steps": 580, "total_steps": 1419, "loss": 0.2428, "lr": 3.5940531691860405e-06, "epoch": 1.226215644820296, "percentage": 40.87, "elapsed_time": "0:57:50", "remaining_time": "1:23:40"}
|
60 |
+
{"current_steps": 590, "total_steps": 1419, "loss": 0.2403, "lr": 3.545220292829113e-06, "epoch": 1.2473572938689217, "percentage": 41.58, "elapsed_time": "0:58:51", "remaining_time": "1:22:41"}
|
61 |
+
{"current_steps": 600, "total_steps": 1419, "loss": 0.2425, "lr": 3.4959555119436033e-06, "epoch": 1.2684989429175475, "percentage": 42.28, "elapsed_time": "0:59:50", "remaining_time": "1:21:41"}
|
62 |
+
{"current_steps": 610, "total_steps": 1419, "loss": 0.2419, "lr": 3.446285583495041e-06, "epoch": 1.2896405919661733, "percentage": 42.99, "elapsed_time": "1:00:50", "remaining_time": "1:20:41"}
|
63 |
+
{"current_steps": 620, "total_steps": 1419, "loss": 0.2434, "lr": 3.396237484494985e-06, "epoch": 1.3107822410147991, "percentage": 43.69, "elapsed_time": "1:01:49", "remaining_time": "1:19:40"}
|
64 |
+
{"current_steps": 630, "total_steps": 1419, "loss": 0.2413, "lr": 3.345838397349115e-06, "epoch": 1.331923890063425, "percentage": 44.4, "elapsed_time": "1:02:49", "remaining_time": "1:18:40"}
|
65 |
+
{"current_steps": 640, "total_steps": 1419, "loss": 0.243, "lr": 3.2951156950937728e-06, "epoch": 1.3530655391120507, "percentage": 45.1, "elapsed_time": "1:03:47", "remaining_time": "1:17:39"}
|
66 |
+
{"current_steps": 650, "total_steps": 1419, "loss": 0.2421, "lr": 3.2440969265289624e-06, "epoch": 1.3742071881606766, "percentage": 45.81, "elapsed_time": "1:04:46", "remaining_time": "1:16:37"}
|
67 |
+
{"current_steps": 660, "total_steps": 1419, "loss": 0.244, "lr": 3.1928098012558895e-06, "epoch": 1.3953488372093024, "percentage": 46.51, "elapsed_time": "1:05:44", "remaining_time": "1:15:36"}
|
68 |
+
{"current_steps": 670, "total_steps": 1419, "loss": 0.2439, "lr": 3.1412821746271693e-06, "epoch": 1.4164904862579282, "percentage": 47.22, "elapsed_time": "1:06:42", "remaining_time": "1:14:34"}
|
69 |
+
{"current_steps": 680, "total_steps": 1419, "loss": 0.2408, "lr": 3.0895420326178705e-06, "epoch": 1.437632135306554, "percentage": 47.92, "elapsed_time": "1:07:42", "remaining_time": "1:13:34"}
|
70 |
+
{"current_steps": 690, "total_steps": 1419, "loss": 0.2423, "lr": 3.03761747662561e-06, "epoch": 1.4587737843551798, "percentage": 48.63, "elapsed_time": "1:08:42", "remaining_time": "1:12:35"}
|
71 |
+
{"current_steps": 700, "total_steps": 1419, "loss": 0.2401, "lr": 2.985536708207971e-06, "epoch": 1.4799154334038054, "percentage": 49.33, "elapsed_time": "1:09:41", "remaining_time": "1:11:35"}
|
72 |
+
{"current_steps": 710, "total_steps": 1419, "loss": 0.2449, "lr": 2.933328013765505e-06, "epoch": 1.5010570824524314, "percentage": 50.04, "elapsed_time": "1:10:40", "remaining_time": "1:10:34"}
|
73 |
+
{"current_steps": 720, "total_steps": 1419, "loss": 0.2431, "lr": 2.8810197491786714e-06, "epoch": 1.522198731501057, "percentage": 50.74, "elapsed_time": "1:11:40", "remaining_time": "1:09:34"}
|
74 |
+
{"current_steps": 730, "total_steps": 1419, "loss": 0.2414, "lr": 2.8286403244070252e-06, "epoch": 1.543340380549683, "percentage": 51.44, "elapsed_time": "1:12:39", "remaining_time": "1:08:34"}
|
75 |
+
{"current_steps": 740, "total_steps": 1419, "loss": 0.2415, "lr": 2.7762181880590442e-06, "epoch": 1.5644820295983086, "percentage": 52.15, "elapsed_time": "1:13:38", "remaining_time": "1:07:33"}
|
76 |
+
{"current_steps": 750, "total_steps": 1419, "loss": 0.2431, "lr": 2.723781811940956e-06, "epoch": 1.5856236786469344, "percentage": 52.85, "elapsed_time": "1:14:37", "remaining_time": "1:06:33"}
|
77 |
+
{"current_steps": 760, "total_steps": 1419, "loss": 0.2417, "lr": 2.6713596755929755e-06, "epoch": 1.6067653276955602, "percentage": 53.56, "elapsed_time": "1:15:37", "remaining_time": "1:05:34"}
|
78 |
+
{"current_steps": 770, "total_steps": 1419, "loss": 0.2391, "lr": 2.6189802508213297e-06, "epoch": 1.627906976744186, "percentage": 54.26, "elapsed_time": "1:16:35", "remaining_time": "1:04:33"}
|
79 |
+
{"current_steps": 780, "total_steps": 1419, "loss": 0.2445, "lr": 2.5666719862344957e-06, "epoch": 1.6490486257928119, "percentage": 54.97, "elapsed_time": "1:17:35", "remaining_time": "1:03:34"}
|
80 |
+
{"current_steps": 790, "total_steps": 1419, "loss": 0.2409, "lr": 2.51446329179203e-06, "epoch": 1.6701902748414377, "percentage": 55.67, "elapsed_time": "1:18:34", "remaining_time": "1:02:33"}
|
81 |
+
{"current_steps": 800, "total_steps": 1419, "loss": 0.241, "lr": 2.4623825233743896e-06, "epoch": 1.6913319238900635, "percentage": 56.38, "elapsed_time": "1:19:33", "remaining_time": "1:01:33"}
|
82 |
+
{"current_steps": 810, "total_steps": 1419, "loss": 0.2434, "lr": 2.4104579673821297e-06, "epoch": 1.712473572938689, "percentage": 57.08, "elapsed_time": "1:20:33", "remaining_time": "1:00:33"}
|
83 |
+
{"current_steps": 820, "total_steps": 1419, "loss": 0.2413, "lr": 2.358717825372831e-06, "epoch": 1.733615221987315, "percentage": 57.79, "elapsed_time": "1:21:31", "remaining_time": "0:59:33"}
|
84 |
+
{"current_steps": 830, "total_steps": 1419, "loss": 0.2385, "lr": 2.3071901987441116e-06, "epoch": 1.7547568710359407, "percentage": 58.49, "elapsed_time": "1:22:32", "remaining_time": "0:58:34"}
|
85 |
+
{"current_steps": 840, "total_steps": 1419, "loss": 0.2386, "lr": 2.2559030734710396e-06, "epoch": 1.7758985200845667, "percentage": 59.2, "elapsed_time": "1:23:31", "remaining_time": "0:57:34"}
|
86 |
+
{"current_steps": 850, "total_steps": 1419, "loss": 0.2398, "lr": 2.2048843049062275e-06, "epoch": 1.7970401691331923, "percentage": 59.9, "elapsed_time": "1:24:30", "remaining_time": "0:56:34"}
|
87 |
+
{"current_steps": 860, "total_steps": 1419, "loss": 0.2413, "lr": 2.1541616026508854e-06, "epoch": 1.8181818181818183, "percentage": 60.61, "elapsed_time": "1:25:29", "remaining_time": "0:55:34"}
|
88 |
+
{"current_steps": 870, "total_steps": 1419, "loss": 0.2417, "lr": 2.103762515505016e-06, "epoch": 1.839323467230444, "percentage": 61.31, "elapsed_time": "1:26:28", "remaining_time": "0:54:34"}
|
89 |
+
{"current_steps": 880, "total_steps": 1419, "loss": 0.236, "lr": 2.0537144165049597e-06, "epoch": 1.8604651162790697, "percentage": 62.02, "elapsed_time": "1:27:28", "remaining_time": "0:53:34"}
|
90 |
+
{"current_steps": 890, "total_steps": 1419, "loss": 0.2396, "lr": 2.0040444880563974e-06, "epoch": 1.8816067653276956, "percentage": 62.72, "elapsed_time": "1:28:27", "remaining_time": "0:52:34"}
|
91 |
+
{"current_steps": 900, "total_steps": 1419, "loss": 0.2402, "lr": 1.9547797071708873e-06, "epoch": 1.9027484143763214, "percentage": 63.42, "elapsed_time": "1:29:26", "remaining_time": "0:51:34"}
|
92 |
+
{"current_steps": 910, "total_steps": 1419, "loss": 0.2454, "lr": 1.90594683081396e-06, "epoch": 1.9238900634249472, "percentage": 64.13, "elapsed_time": "1:30:26", "remaining_time": "0:50:35"}
|
93 |
+
{"current_steps": 920, "total_steps": 1419, "loss": 0.241, "lr": 1.8575723813727234e-06, "epoch": 1.945031712473573, "percentage": 64.83, "elapsed_time": "1:31:25", "remaining_time": "0:49:35"}
|
94 |
+
{"current_steps": 930, "total_steps": 1419, "loss": 0.2377, "lr": 1.8096826322508745e-06, "epoch": 1.9661733615221988, "percentage": 65.54, "elapsed_time": "1:32:24", "remaining_time": "0:48:35"}
|
95 |
+
{"current_steps": 940, "total_steps": 1419, "loss": 0.2363, "lr": 1.7623035935989388e-06, "epoch": 1.9873150105708244, "percentage": 66.24, "elapsed_time": "1:33:24", "remaining_time": "0:47:35"}
|
96 |
+
{"current_steps": 946, "total_steps": 1419, "eval_loss": 0.3176339268684387, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "1:34:46", "remaining_time": "0:47:23"}
|
97 |
+
{"current_steps": 950, "total_steps": 1419, "loss": 0.2124, "lr": 1.7154609981874945e-06, "epoch": 2.0084566596194504, "percentage": 66.95, "elapsed_time": "1:36:23", "remaining_time": "0:47:35"}
|
98 |
+
{"current_steps": 960, "total_steps": 1419, "loss": 0.1655, "lr": 1.6691802874310402e-06, "epoch": 2.029598308668076, "percentage": 67.65, "elapsed_time": "1:37:24", "remaining_time": "0:46:34"}
|
99 |
+
{"current_steps": 970, "total_steps": 1419, "loss": 0.1695, "lr": 1.6234865975701169e-06, "epoch": 2.050739957716702, "percentage": 68.36, "elapsed_time": "1:38:23", "remaining_time": "0:45:32"}
|