Training in progress, step 150
Browse files- adapter_model.safetensors +1 -1
- trainer_log.jsonl +50 -0
adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 828527688
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b4e231f1e511a21a6e17d9eb7f78befd6ce49c2a0bb20a26631bc845ce3e8301
|
3 |
size 828527688
|
trainer_log.jsonl
CHANGED
@@ -102,3 +102,53 @@
|
|
102 |
{"current_steps": 102, "total_steps": 154, "loss": 0.2465, "lr": 1.2947162435741278e-05, "epoch": 1.3246753246753247, "percentage": 66.23, "elapsed_time": "0:16:58", "remaining_time": "0:08:39"}
|
103 |
{"current_steps": 103, "total_steps": 154, "loss": 0.2241, "lr": 1.2500000000000006e-05, "epoch": 1.3376623376623376, "percentage": 66.88, "elapsed_time": "0:17:07", "remaining_time": "0:08:28"}
|
104 |
{"current_steps": 104, "total_steps": 154, "loss": 0.2248, "lr": 1.205810757666894e-05, "epoch": 1.3506493506493507, "percentage": 67.53, "elapsed_time": "0:17:16", "remaining_time": "0:08:18"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
102 |
{"current_steps": 102, "total_steps": 154, "loss": 0.2465, "lr": 1.2947162435741278e-05, "epoch": 1.3246753246753247, "percentage": 66.23, "elapsed_time": "0:16:58", "remaining_time": "0:08:39"}
|
103 |
{"current_steps": 103, "total_steps": 154, "loss": 0.2241, "lr": 1.2500000000000006e-05, "epoch": 1.3376623376623376, "percentage": 66.88, "elapsed_time": "0:17:07", "remaining_time": "0:08:28"}
|
104 |
{"current_steps": 104, "total_steps": 154, "loss": 0.2248, "lr": 1.205810757666894e-05, "epoch": 1.3506493506493507, "percentage": 67.53, "elapsed_time": "0:17:16", "remaining_time": "0:08:18"}
|
105 |
+
{"current_steps": 105, "total_steps": 154, "loss": 0.2031, "lr": 1.1621671468032493e-05, "epoch": 1.3636363636363638, "percentage": 68.18, "elapsed_time": "0:17:25", "remaining_time": "0:08:07"}
|
106 |
+
{"current_steps": 106, "total_steps": 154, "loss": 0.2423, "lr": 1.1190875675987356e-05, "epoch": 1.3766233766233766, "percentage": 68.83, "elapsed_time": "0:17:34", "remaining_time": "0:07:57"}
|
107 |
+
{"current_steps": 107, "total_steps": 154, "loss": 0.2267, "lr": 1.0765901824467167e-05, "epoch": 1.3896103896103895, "percentage": 69.48, "elapsed_time": "0:17:42", "remaining_time": "0:07:46"}
|
108 |
+
{"current_steps": 108, "total_steps": 154, "loss": 0.2263, "lr": 1.0346929082869641e-05, "epoch": 1.4025974025974026, "percentage": 70.13, "elapsed_time": "0:17:51", "remaining_time": "0:07:36"}
|
109 |
+
{"current_steps": 109, "total_steps": 154, "loss": 0.1941, "lr": 9.934134090518593e-06, "epoch": 1.4155844155844157, "percentage": 70.78, "elapsed_time": "0:18:00", "remaining_time": "0:07:25"}
|
110 |
+
{"current_steps": 110, "total_steps": 154, "loss": 0.2211, "lr": 9.527690882192636e-06, "epoch": 1.4285714285714286, "percentage": 71.43, "elapsed_time": "0:18:09", "remaining_time": "0:07:15"}
|
111 |
+
{"current_steps": 111, "total_steps": 154, "loss": 0.2175, "lr": 9.127770814751933e-06, "epoch": 1.4415584415584415, "percentage": 72.08, "elapsed_time": "0:18:17", "remaining_time": "0:07:05"}
|
112 |
+
{"current_steps": 112, "total_steps": 154, "loss": 0.258, "lr": 8.734542494893955e-06, "epoch": 1.4545454545454546, "percentage": 72.73, "elapsed_time": "0:18:27", "remaining_time": "0:06:55"}
|
113 |
+
{"current_steps": 113, "total_steps": 154, "loss": 0.2061, "lr": 8.348171708068747e-06, "epoch": 1.4675324675324675, "percentage": 73.38, "elapsed_time": "0:18:36", "remaining_time": "0:06:45"}
|
114 |
+
{"current_steps": 114, "total_steps": 154, "loss": 0.2367, "lr": 7.968821348583644e-06, "epoch": 1.4805194805194806, "percentage": 74.03, "elapsed_time": "0:18:45", "remaining_time": "0:06:34"}
|
115 |
+
{"current_steps": 115, "total_steps": 154, "loss": 0.1913, "lr": 7.5966513509268365e-06, "epoch": 1.4935064935064934, "percentage": 74.68, "elapsed_time": "0:18:53", "remaining_time": "0:06:24"}
|
116 |
+
{"current_steps": 116, "total_steps": 154, "loss": 0.2311, "lr": 7.231818622338823e-06, "epoch": 1.5064935064935066, "percentage": 75.32, "elapsed_time": "0:19:02", "remaining_time": "0:06:14"}
|
117 |
+
{"current_steps": 117, "total_steps": 154, "loss": 0.2195, "lr": 6.8744769766601854e-06, "epoch": 1.5194805194805194, "percentage": 75.97, "elapsed_time": "0:19:11", "remaining_time": "0:06:04"}
|
118 |
+
{"current_steps": 118, "total_steps": 154, "loss": 0.21, "lr": 6.524777069483526e-06, "epoch": 1.5324675324675323, "percentage": 76.62, "elapsed_time": "0:19:20", "remaining_time": "0:05:54"}
|
119 |
+
{"current_steps": 119, "total_steps": 154, "loss": 0.1902, "lr": 6.182866334636889e-06, "epoch": 1.5454545454545454, "percentage": 77.27, "elapsed_time": "0:19:29", "remaining_time": "0:05:43"}
|
120 |
+
{"current_steps": 120, "total_steps": 154, "loss": 0.2293, "lr": 5.848888922025553e-06, "epoch": 1.5584415584415585, "percentage": 77.92, "elapsed_time": "0:19:38", "remaining_time": "0:05:33"}
|
121 |
+
{"current_steps": 121, "total_steps": 154, "loss": 0.227, "lr": 5.522985636858239e-06, "epoch": 1.5714285714285714, "percentage": 78.57, "elapsed_time": "0:19:46", "remaining_time": "0:05:23"}
|
122 |
+
{"current_steps": 122, "total_steps": 154, "loss": 0.1884, "lr": 5.205293880283552e-06, "epoch": 1.5844155844155843, "percentage": 79.22, "elapsed_time": "0:19:55", "remaining_time": "0:05:13"}
|
123 |
+
{"current_steps": 123, "total_steps": 154, "loss": 0.2241, "lr": 4.8959475914614554e-06, "epoch": 1.5974025974025974, "percentage": 79.87, "elapsed_time": "0:20:04", "remaining_time": "0:05:03"}
|
124 |
+
{"current_steps": 124, "total_steps": 154, "loss": 0.215, "lr": 4.5950771910944605e-06, "epoch": 1.6103896103896105, "percentage": 80.52, "elapsed_time": "0:20:13", "remaining_time": "0:04:53"}
|
125 |
+
{"current_steps": 125, "total_steps": 154, "loss": 0.2213, "lr": 4.3028095264420535e-06, "epoch": 1.6233766233766234, "percentage": 81.17, "elapsed_time": "0:20:22", "remaining_time": "0:04:43"}
|
126 |
+
{"current_steps": 126, "total_steps": 154, "loss": 0.2278, "lr": 4.019267817841835e-06, "epoch": 1.6363636363636362, "percentage": 81.82, "elapsed_time": "0:20:30", "remaining_time": "0:04:33"}
|
127 |
+
{"current_steps": 127, "total_steps": 154, "loss": 0.1999, "lr": 3.7445716067596503e-06, "epoch": 1.6493506493506493, "percentage": 82.47, "elapsed_time": "0:20:39", "remaining_time": "0:04:23"}
|
128 |
+
{"current_steps": 128, "total_steps": 154, "loss": 0.2341, "lr": 3.478836705390809e-06, "epoch": 1.6623376623376624, "percentage": 83.12, "elapsed_time": "0:20:48", "remaining_time": "0:04:13"}
|
129 |
+
{"current_steps": 129, "total_steps": 154, "loss": 0.2206, "lr": 3.222175147833556e-06, "epoch": 1.6753246753246753, "percentage": 83.77, "elapsed_time": "0:20:57", "remaining_time": "0:04:03"}
|
130 |
+
{"current_steps": 130, "total_steps": 154, "loss": 0.2408, "lr": 2.974695142855388e-06, "epoch": 1.6883116883116882, "percentage": 84.42, "elapsed_time": "0:21:06", "remaining_time": "0:03:53"}
|
131 |
+
{"current_steps": 131, "total_steps": 154, "loss": 0.2164, "lr": 2.7365010282720952e-06, "epoch": 1.7012987012987013, "percentage": 85.06, "elapsed_time": "0:21:15", "remaining_time": "0:03:43"}
|
132 |
+
{"current_steps": 132, "total_steps": 154, "loss": 0.2044, "lr": 2.507693226958871e-06, "epoch": 1.7142857142857144, "percentage": 85.71, "elapsed_time": "0:21:23", "remaining_time": "0:03:33"}
|
133 |
+
{"current_steps": 133, "total_steps": 154, "loss": 0.1979, "lr": 2.2883682045119063e-06, "epoch": 1.7272727272727273, "percentage": 86.36, "elapsed_time": "0:21:32", "remaining_time": "0:03:24"}
|
134 |
+
{"current_steps": 134, "total_steps": 154, "loss": 0.2124, "lr": 2.0786184285784297e-06, "epoch": 1.7402597402597402, "percentage": 87.01, "elapsed_time": "0:21:41", "remaining_time": "0:03:14"}
|
135 |
+
{"current_steps": 135, "total_steps": 154, "loss": 0.2435, "lr": 1.8785323298722097e-06, "epoch": 1.7532467532467533, "percentage": 87.66, "elapsed_time": "0:21:50", "remaining_time": "0:03:04"}
|
136 |
+
{"current_steps": 136, "total_steps": 154, "loss": 0.2092, "lr": 1.6881942648911076e-06, "epoch": 1.7662337662337664, "percentage": 88.31, "elapsed_time": "0:21:59", "remaining_time": "0:02:54"}
|
137 |
+
{"current_steps": 137, "total_steps": 154, "loss": 0.2117, "lr": 1.5076844803522922e-06, "epoch": 1.7792207792207793, "percentage": 88.96, "elapsed_time": "0:22:08", "remaining_time": "0:02:44"}
|
138 |
+
{"current_steps": 138, "total_steps": 154, "loss": 0.2325, "lr": 1.3370790793601373e-06, "epoch": 1.7922077922077921, "percentage": 89.61, "elapsed_time": "0:22:17", "remaining_time": "0:02:35"}
|
139 |
+
{"current_steps": 139, "total_steps": 154, "loss": 0.186, "lr": 1.1764499893210878e-06, "epoch": 1.8051948051948052, "percentage": 90.26, "elapsed_time": "0:22:25", "remaining_time": "0:02:25"}
|
140 |
+
{"current_steps": 140, "total_steps": 154, "loss": 0.1942, "lr": 1.0258649316189722e-06, "epoch": 1.8181818181818183, "percentage": 90.91, "elapsed_time": "0:22:34", "remaining_time": "0:02:15"}
|
141 |
+
{"current_steps": 141, "total_steps": 154, "loss": 0.2093, "lr": 8.85387393063622e-07, "epoch": 1.8311688311688312, "percentage": 91.56, "elapsed_time": "0:22:43", "remaining_time": "0:02:05"}
|
142 |
+
{"current_steps": 142, "total_steps": 154, "loss": 0.2134, "lr": 7.550765991247654e-07, "epoch": 1.844155844155844, "percentage": 92.21, "elapsed_time": "0:22:52", "remaining_time": "0:01:55"}
|
143 |
+
{"current_steps": 143, "total_steps": 154, "loss": 0.2068, "lr": 6.349874889624962e-07, "epoch": 1.8571428571428572, "percentage": 92.86, "elapsed_time": "0:23:01", "remaining_time": "0:01:46"}
|
144 |
+
{"current_steps": 144, "total_steps": 154, "loss": 0.2025, "lr": 5.25170692264887e-07, "epoch": 1.87012987012987, "percentage": 93.51, "elapsed_time": "0:23:09", "remaining_time": "0:01:36"}
|
145 |
+
{"current_steps": 145, "total_steps": 154, "loss": 0.2288, "lr": 4.256725079024554e-07, "epoch": 1.883116883116883, "percentage": 94.16, "elapsed_time": "0:23:18", "remaining_time": "0:01:26"}
|
146 |
+
{"current_steps": 146, "total_steps": 154, "loss": 0.2264, "lr": 3.3653488440851255e-07, "epoch": 1.896103896103896, "percentage": 94.81, "elapsed_time": "0:23:27", "remaining_time": "0:01:17"}
|
147 |
+
{"current_steps": 147, "total_steps": 154, "loss": 0.211, "lr": 2.5779540229361745e-07, "epoch": 1.9090909090909092, "percentage": 95.45, "elapsed_time": "0:23:36", "remaining_time": "0:01:07"}
|
148 |
+
{"current_steps": 148, "total_steps": 154, "loss": 0.2003, "lr": 1.8948725820160662e-07, "epoch": 1.922077922077922, "percentage": 96.1, "elapsed_time": "0:23:45", "remaining_time": "0:00:57"}
|
149 |
+
{"current_steps": 149, "total_steps": 154, "loss": 0.2245, "lr": 1.3163925091384533e-07, "epoch": 1.935064935064935, "percentage": 96.75, "elapsed_time": "0:23:54", "remaining_time": "0:00:48"}
|
150 |
+
{"current_steps": 150, "total_steps": 154, "loss": 0.1908, "lr": 8.427576920763958e-08, "epoch": 1.948051948051948, "percentage": 97.4, "elapsed_time": "0:24:02", "remaining_time": "0:00:38"}
|
151 |
+
{"current_steps": 151, "total_steps": 154, "loss": 0.1992, "lr": 4.741678157389739e-08, "epoch": 1.9610389610389611, "percentage": 98.05, "elapsed_time": "0:25:08", "remaining_time": "0:00:29"}
|
152 |
+
{"current_steps": 152, "total_steps": 154, "loss": 0.2069, "lr": 2.1077827798404726e-08, "epoch": 1.974025974025974, "percentage": 98.7, "elapsed_time": "0:25:17", "remaining_time": "0:00:19"}
|
153 |
+
{"current_steps": 153, "total_steps": 154, "loss": 0.1865, "lr": 5.270012410216185e-09, "epoch": 1.987012987012987, "percentage": 99.35, "elapsed_time": "0:25:25", "remaining_time": "0:00:09"}
|
154 |
+
{"current_steps": 154, "total_steps": 154, "loss": 0.1957, "lr": 0.0, "epoch": 2.0, "percentage": 100.0, "elapsed_time": "0:25:34", "remaining_time": "0:00:00"}
|