Training in progress, step 100
Browse files- adapter_model.safetensors +1 -1
- trainer_log.jsonl +50 -0
adapter_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 828527688
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2e3c97d77d8592284aa0a04cbdf994e812a84ce900c025924d69a7f980c3edc4
|
3 |
size 828527688
|
trainer_log.jsonl
CHANGED
@@ -52,3 +52,53 @@
|
|
52 |
{"current_steps": 52, "total_steps": 154, "loss": 0.2322, "lr": 3.7500000000000003e-05, "epoch": 0.6753246753246753, "percentage": 33.77, "elapsed_time": "0:08:41", "remaining_time": "0:17:02"}
|
53 |
{"current_steps": 53, "total_steps": 154, "loss": 0.2551, "lr": 3.705283756425872e-05, "epoch": 0.6883116883116883, "percentage": 34.42, "elapsed_time": "0:08:50", "remaining_time": "0:16:50"}
|
54 |
{"current_steps": 54, "total_steps": 154, "loss": 0.2463, "lr": 3.6600593640234086e-05, "epoch": 0.7012987012987013, "percentage": 35.06, "elapsed_time": "0:08:58", "remaining_time": "0:16:37"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
52 |
{"current_steps": 52, "total_steps": 154, "loss": 0.2322, "lr": 3.7500000000000003e-05, "epoch": 0.6753246753246753, "percentage": 33.77, "elapsed_time": "0:08:41", "remaining_time": "0:17:02"}
|
53 |
{"current_steps": 53, "total_steps": 154, "loss": 0.2551, "lr": 3.705283756425872e-05, "epoch": 0.6883116883116883, "percentage": 34.42, "elapsed_time": "0:08:50", "remaining_time": "0:16:50"}
|
54 |
{"current_steps": 54, "total_steps": 154, "loss": 0.2463, "lr": 3.6600593640234086e-05, "epoch": 0.7012987012987013, "percentage": 35.06, "elapsed_time": "0:08:58", "remaining_time": "0:16:37"}
|
55 |
+
{"current_steps": 55, "total_steps": 154, "loss": 0.2484, "lr": 3.6143458894413465e-05, "epoch": 0.7142857142857143, "percentage": 35.71, "elapsed_time": "0:09:07", "remaining_time": "0:16:25"}
|
56 |
+
{"current_steps": 56, "total_steps": 154, "loss": 0.2468, "lr": 3.568162605525953e-05, "epoch": 0.7272727272727273, "percentage": 36.36, "elapsed_time": "0:09:16", "remaining_time": "0:16:13"}
|
57 |
+
{"current_steps": 57, "total_steps": 154, "loss": 0.2516, "lr": 3.5215289831955786e-05, "epoch": 0.7402597402597403, "percentage": 37.01, "elapsed_time": "0:09:24", "remaining_time": "0:16:01"}
|
58 |
+
{"current_steps": 58, "total_steps": 154, "loss": 0.2236, "lr": 3.474464683231698e-05, "epoch": 0.7532467532467533, "percentage": 37.66, "elapsed_time": "0:09:33", "remaining_time": "0:15:49"}
|
59 |
+
{"current_steps": 59, "total_steps": 154, "loss": 0.2525, "lr": 3.426989547989902e-05, "epoch": 0.7662337662337663, "percentage": 38.31, "elapsed_time": "0:09:42", "remaining_time": "0:15:38"}
|
60 |
+
{"current_steps": 60, "total_steps": 154, "loss": 0.2246, "lr": 3.379123593034342e-05, "epoch": 0.7792207792207793, "percentage": 38.96, "elapsed_time": "0:09:51", "remaining_time": "0:15:26"}
|
61 |
+
{"current_steps": 61, "total_steps": 154, "loss": 0.2282, "lr": 3.330886998699149e-05, "epoch": 0.7922077922077922, "percentage": 39.61, "elapsed_time": "0:10:00", "remaining_time": "0:15:15"}
|
62 |
+
{"current_steps": 62, "total_steps": 154, "loss": 0.24, "lr": 3.282300101580386e-05, "epoch": 0.8051948051948052, "percentage": 40.26, "elapsed_time": "0:10:08", "remaining_time": "0:15:03"}
|
63 |
+
{"current_steps": 63, "total_steps": 154, "loss": 0.2167, "lr": 3.2333833859621153e-05, "epoch": 0.8181818181818182, "percentage": 40.91, "elapsed_time": "0:10:17", "remaining_time": "0:14:52"}
|
64 |
+
{"current_steps": 64, "total_steps": 154, "loss": 0.237, "lr": 3.1841574751802076e-05, "epoch": 0.8311688311688312, "percentage": 41.56, "elapsed_time": "0:10:26", "remaining_time": "0:14:41"}
|
65 |
+
{"current_steps": 65, "total_steps": 154, "loss": 0.2245, "lr": 3.13464312292752e-05, "epoch": 0.8441558441558441, "percentage": 42.21, "elapsed_time": "0:10:35", "remaining_time": "0:14:30"}
|
66 |
+
{"current_steps": 66, "total_steps": 154, "loss": 0.223, "lr": 3.084861204504122e-05, "epoch": 0.8571428571428571, "percentage": 42.86, "elapsed_time": "0:10:43", "remaining_time": "0:14:18"}
|
67 |
+
{"current_steps": 67, "total_steps": 154, "loss": 0.2461, "lr": 3.0348327080162435e-05, "epoch": 0.8701298701298701, "percentage": 43.51, "elapsed_time": "0:10:52", "remaining_time": "0:14:07"}
|
68 |
+
{"current_steps": 68, "total_steps": 154, "loss": 0.2315, "lr": 2.9845787255276753e-05, "epoch": 0.8831168831168831, "percentage": 44.16, "elapsed_time": "0:11:01", "remaining_time": "0:13:56"}
|
69 |
+
{"current_steps": 69, "total_steps": 154, "loss": 0.2191, "lr": 2.9341204441673266e-05, "epoch": 0.8961038961038961, "percentage": 44.81, "elapsed_time": "0:11:10", "remaining_time": "0:13:45"}
|
70 |
+
{"current_steps": 70, "total_steps": 154, "loss": 0.2466, "lr": 2.8834791371967142e-05, "epoch": 0.9090909090909091, "percentage": 45.45, "elapsed_time": "0:11:19", "remaining_time": "0:13:35"}
|
71 |
+
{"current_steps": 71, "total_steps": 154, "loss": 0.2376, "lr": 2.8326761550411345e-05, "epoch": 0.922077922077922, "percentage": 46.1, "elapsed_time": "0:11:28", "remaining_time": "0:13:24"}
|
72 |
+
{"current_steps": 72, "total_steps": 154, "loss": 0.2404, "lr": 2.781732916288303e-05, "epoch": 0.935064935064935, "percentage": 46.75, "elapsed_time": "0:11:36", "remaining_time": "0:13:13"}
|
73 |
+
{"current_steps": 73, "total_steps": 154, "loss": 0.259, "lr": 2.7306708986582553e-05, "epoch": 0.948051948051948, "percentage": 47.4, "elapsed_time": "0:11:45", "remaining_time": "0:13:02"}
|
74 |
+
{"current_steps": 74, "total_steps": 154, "loss": 0.2438, "lr": 2.679511629948319e-05, "epoch": 0.961038961038961, "percentage": 48.05, "elapsed_time": "0:11:54", "remaining_time": "0:12:52"}
|
75 |
+
{"current_steps": 75, "total_steps": 154, "loss": 0.2442, "lr": 2.628276678956974e-05, "epoch": 0.974025974025974, "percentage": 48.7, "elapsed_time": "0:12:03", "remaining_time": "0:12:41"}
|
76 |
+
{"current_steps": 76, "total_steps": 154, "loss": 0.2366, "lr": 2.5769876463904265e-05, "epoch": 0.987012987012987, "percentage": 49.35, "elapsed_time": "0:12:11", "remaining_time": "0:12:31"}
|
77 |
+
{"current_steps": 77, "total_steps": 154, "loss": 0.238, "lr": 2.5256661557557247e-05, "epoch": 1.0, "percentage": 50.0, "elapsed_time": "0:12:20", "remaining_time": "0:12:20"}
|
78 |
+
{"current_steps": 78, "total_steps": 154, "loss": 0.2335, "lr": 2.4743338442442755e-05, "epoch": 1.0129870129870129, "percentage": 50.65, "elapsed_time": "0:12:29", "remaining_time": "0:12:10"}
|
79 |
+
{"current_steps": 79, "total_steps": 154, "loss": 0.245, "lr": 2.4230123536095748e-05, "epoch": 1.025974025974026, "percentage": 51.3, "elapsed_time": "0:12:38", "remaining_time": "0:11:59"}
|
80 |
+
{"current_steps": 80, "total_steps": 154, "loss": 0.2213, "lr": 2.3717233210430256e-05, "epoch": 1.0389610389610389, "percentage": 51.95, "elapsed_time": "0:12:47", "remaining_time": "0:11:49"}
|
81 |
+
{"current_steps": 81, "total_steps": 154, "loss": 0.2353, "lr": 2.3204883700516812e-05, "epoch": 1.051948051948052, "percentage": 52.6, "elapsed_time": "0:12:56", "remaining_time": "0:11:39"}
|
82 |
+
{"current_steps": 82, "total_steps": 154, "loss": 0.2266, "lr": 2.2693291013417453e-05, "epoch": 1.0649350649350648, "percentage": 53.25, "elapsed_time": "0:13:04", "remaining_time": "0:11:29"}
|
83 |
+
{"current_steps": 83, "total_steps": 154, "loss": 0.2503, "lr": 2.2182670837116975e-05, "epoch": 1.077922077922078, "percentage": 53.9, "elapsed_time": "0:13:13", "remaining_time": "0:11:18"}
|
84 |
+
{"current_steps": 84, "total_steps": 154, "loss": 0.2464, "lr": 2.1673238449588668e-05, "epoch": 1.0909090909090908, "percentage": 54.55, "elapsed_time": "0:13:22", "remaining_time": "0:11:08"}
|
85 |
+
{"current_steps": 85, "total_steps": 154, "loss": 0.2075, "lr": 2.116520862803286e-05, "epoch": 1.103896103896104, "percentage": 55.19, "elapsed_time": "0:13:31", "remaining_time": "0:10:58"}
|
86 |
+
{"current_steps": 86, "total_steps": 154, "loss": 0.2021, "lr": 2.0658795558326743e-05, "epoch": 1.1168831168831168, "percentage": 55.84, "elapsed_time": "0:13:40", "remaining_time": "0:10:48"}
|
87 |
+
{"current_steps": 87, "total_steps": 154, "loss": 0.2033, "lr": 2.015421274472325e-05, "epoch": 1.12987012987013, "percentage": 56.49, "elapsed_time": "0:13:48", "remaining_time": "0:10:38"}
|
88 |
+
{"current_steps": 88, "total_steps": 154, "loss": 0.2109, "lr": 1.965167291983757e-05, "epoch": 1.1428571428571428, "percentage": 57.14, "elapsed_time": "0:13:57", "remaining_time": "0:10:28"}
|
89 |
+
{"current_steps": 89, "total_steps": 154, "loss": 0.2073, "lr": 1.9151387954958794e-05, "epoch": 1.155844155844156, "percentage": 57.79, "elapsed_time": "0:14:06", "remaining_time": "0:10:18"}
|
90 |
+
{"current_steps": 90, "total_steps": 154, "loss": 0.2126, "lr": 1.8653568770724806e-05, "epoch": 1.1688311688311688, "percentage": 58.44, "elapsed_time": "0:14:15", "remaining_time": "0:10:08"}
|
91 |
+
{"current_steps": 91, "total_steps": 154, "loss": 0.199, "lr": 1.815842524819793e-05, "epoch": 1.1818181818181819, "percentage": 59.09, "elapsed_time": "0:14:24", "remaining_time": "0:09:58"}
|
92 |
+
{"current_steps": 92, "total_steps": 154, "loss": 0.209, "lr": 1.7666166140378852e-05, "epoch": 1.1948051948051948, "percentage": 59.74, "elapsed_time": "0:14:32", "remaining_time": "0:09:48"}
|
93 |
+
{"current_steps": 93, "total_steps": 154, "loss": 0.2111, "lr": 1.7176998984196146e-05, "epoch": 1.2077922077922079, "percentage": 60.39, "elapsed_time": "0:14:41", "remaining_time": "0:09:38"}
|
94 |
+
{"current_steps": 94, "total_steps": 154, "loss": 0.2169, "lr": 1.6691130013008514e-05, "epoch": 1.2207792207792207, "percentage": 61.04, "elapsed_time": "0:14:50", "remaining_time": "0:09:28"}
|
95 |
+
{"current_steps": 95, "total_steps": 154, "loss": 0.2156, "lr": 1.620876406965658e-05, "epoch": 1.2337662337662338, "percentage": 61.69, "elapsed_time": "0:14:59", "remaining_time": "0:09:18"}
|
96 |
+
{"current_steps": 96, "total_steps": 154, "loss": 0.2373, "lr": 1.5730104520100982e-05, "epoch": 1.2467532467532467, "percentage": 62.34, "elapsed_time": "0:15:08", "remaining_time": "0:09:08"}
|
97 |
+
{"current_steps": 97, "total_steps": 154, "loss": 0.2301, "lr": 1.5255353167683017e-05, "epoch": 1.2597402597402598, "percentage": 62.99, "elapsed_time": "0:15:17", "remaining_time": "0:08:58"}
|
98 |
+
{"current_steps": 98, "total_steps": 154, "loss": 0.2418, "lr": 1.4784710168044213e-05, "epoch": 1.2727272727272727, "percentage": 63.64, "elapsed_time": "0:15:25", "remaining_time": "0:08:49"}
|
99 |
+
{"current_steps": 99, "total_steps": 154, "loss": 0.2008, "lr": 1.4318373944740484e-05, "epoch": 1.2857142857142856, "percentage": 64.29, "elapsed_time": "0:15:34", "remaining_time": "0:08:39"}
|
100 |
+
{"current_steps": 100, "total_steps": 154, "loss": 0.2071, "lr": 1.3856541105586545e-05, "epoch": 1.2987012987012987, "percentage": 64.94, "elapsed_time": "0:15:43", "remaining_time": "0:08:29"}
|
101 |
+
{"current_steps": 101, "total_steps": 154, "loss": 0.2028, "lr": 1.339940635976592e-05, "epoch": 1.3116883116883118, "percentage": 65.58, "elapsed_time": "0:16:50", "remaining_time": "0:08:50"}
|
102 |
+
{"current_steps": 102, "total_steps": 154, "loss": 0.2465, "lr": 1.2947162435741278e-05, "epoch": 1.3246753246753247, "percentage": 66.23, "elapsed_time": "0:16:58", "remaining_time": "0:08:39"}
|
103 |
+
{"current_steps": 103, "total_steps": 154, "loss": 0.2241, "lr": 1.2500000000000006e-05, "epoch": 1.3376623376623376, "percentage": 66.88, "elapsed_time": "0:17:07", "remaining_time": "0:08:28"}
|
104 |
+
{"current_steps": 104, "total_steps": 154, "loss": 0.2248, "lr": 1.205810757666894e-05, "epoch": 1.3506493506493507, "percentage": 67.53, "elapsed_time": "0:17:16", "remaining_time": "0:08:18"}
|