Training in progress, epoch 3
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4976698672
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0e55a6c1e132c09a7d5ea6b6da84500b3c9732a3dcf525cd8dac447d37fd1004
|
3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999802720
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1d195fd3af925f949d024df10b5806196a6b9b18ec47751bbfed572443097327
|
3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4915916176
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4f7af3e1af00e3492d9e5486ee02b5176a9cab95af4db94a5761037858fd01fa
|
3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1168138808
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8aa18327f7c95a2c8e8977f6975685a6703863f4b0b91bba74fe074324f00649
|
3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
@@ -67,3 +67,36 @@
|
|
67 |
{"current_steps": 660, "total_steps": 1005, "loss": 0.7386, "lr": 5e-06, "epoch": 1.9701492537313432, "percentage": 65.67, "elapsed_time": "10:41:09", "remaining_time": "5:35:09"}
|
68 |
{"current_steps": 670, "total_steps": 1005, "loss": 0.7335, "lr": 5e-06, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "10:50:44", "remaining_time": "5:25:22"}
|
69 |
{"current_steps": 670, "total_steps": 1005, "eval_loss": 0.7694990634918213, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "10:56:42", "remaining_time": "5:28:21"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
67 |
{"current_steps": 660, "total_steps": 1005, "loss": 0.7386, "lr": 5e-06, "epoch": 1.9701492537313432, "percentage": 65.67, "elapsed_time": "10:41:09", "remaining_time": "5:35:09"}
|
68 |
{"current_steps": 670, "total_steps": 1005, "loss": 0.7335, "lr": 5e-06, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "10:50:44", "remaining_time": "5:25:22"}
|
69 |
{"current_steps": 670, "total_steps": 1005, "eval_loss": 0.7694990634918213, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "10:56:42", "remaining_time": "5:28:21"}
|
70 |
+
{"current_steps": 680, "total_steps": 1005, "loss": 0.6893, "lr": 5e-06, "epoch": 2.029850746268657, "percentage": 67.66, "elapsed_time": "11:07:33", "remaining_time": "5:19:03"}
|
71 |
+
{"current_steps": 690, "total_steps": 1005, "loss": 0.6913, "lr": 5e-06, "epoch": 2.0597014925373136, "percentage": 68.66, "elapsed_time": "11:17:11", "remaining_time": "5:09:09"}
|
72 |
+
{"current_steps": 700, "total_steps": 1005, "loss": 0.6895, "lr": 5e-06, "epoch": 2.08955223880597, "percentage": 69.65, "elapsed_time": "11:26:51", "remaining_time": "4:59:16"}
|
73 |
+
{"current_steps": 710, "total_steps": 1005, "loss": 0.6916, "lr": 5e-06, "epoch": 2.1194029850746268, "percentage": 70.65, "elapsed_time": "11:36:29", "remaining_time": "4:49:23"}
|
74 |
+
{"current_steps": 720, "total_steps": 1005, "loss": 0.6935, "lr": 5e-06, "epoch": 2.1492537313432836, "percentage": 71.64, "elapsed_time": "11:46:08", "remaining_time": "4:39:31"}
|
75 |
+
{"current_steps": 730, "total_steps": 1005, "loss": 0.6951, "lr": 5e-06, "epoch": 2.1791044776119404, "percentage": 72.64, "elapsed_time": "11:55:45", "remaining_time": "4:29:38"}
|
76 |
+
{"current_steps": 740, "total_steps": 1005, "loss": 0.6904, "lr": 5e-06, "epoch": 2.208955223880597, "percentage": 73.63, "elapsed_time": "12:05:23", "remaining_time": "4:19:46"}
|
77 |
+
{"current_steps": 750, "total_steps": 1005, "loss": 0.6935, "lr": 5e-06, "epoch": 2.2388059701492535, "percentage": 74.63, "elapsed_time": "12:15:00", "remaining_time": "4:09:54"}
|
78 |
+
{"current_steps": 760, "total_steps": 1005, "loss": 0.6985, "lr": 5e-06, "epoch": 2.2686567164179103, "percentage": 75.62, "elapsed_time": "12:24:38", "remaining_time": "4:00:02"}
|
79 |
+
{"current_steps": 770, "total_steps": 1005, "loss": 0.6989, "lr": 5e-06, "epoch": 2.298507462686567, "percentage": 76.62, "elapsed_time": "12:34:15", "remaining_time": "3:50:11"}
|
80 |
+
{"current_steps": 780, "total_steps": 1005, "loss": 0.6993, "lr": 5e-06, "epoch": 2.328358208955224, "percentage": 77.61, "elapsed_time": "12:43:55", "remaining_time": "3:40:21"}
|
81 |
+
{"current_steps": 790, "total_steps": 1005, "loss": 0.6946, "lr": 5e-06, "epoch": 2.3582089552238807, "percentage": 78.61, "elapsed_time": "12:53:33", "remaining_time": "3:30:31"}
|
82 |
+
{"current_steps": 800, "total_steps": 1005, "loss": 0.6962, "lr": 5e-06, "epoch": 2.388059701492537, "percentage": 79.6, "elapsed_time": "13:03:12", "remaining_time": "3:20:41"}
|
83 |
+
{"current_steps": 810, "total_steps": 1005, "loss": 0.6953, "lr": 5e-06, "epoch": 2.417910447761194, "percentage": 80.6, "elapsed_time": "13:12:51", "remaining_time": "3:10:52"}
|
84 |
+
{"current_steps": 820, "total_steps": 1005, "loss": 0.6931, "lr": 5e-06, "epoch": 2.4477611940298507, "percentage": 81.59, "elapsed_time": "13:22:28", "remaining_time": "3:01:02"}
|
85 |
+
{"current_steps": 830, "total_steps": 1005, "loss": 0.6955, "lr": 5e-06, "epoch": 2.4776119402985075, "percentage": 82.59, "elapsed_time": "13:32:04", "remaining_time": "2:51:13"}
|
86 |
+
{"current_steps": 840, "total_steps": 1005, "loss": 0.6933, "lr": 5e-06, "epoch": 2.5074626865671643, "percentage": 83.58, "elapsed_time": "13:41:40", "remaining_time": "2:41:24"}
|
87 |
+
{"current_steps": 850, "total_steps": 1005, "loss": 0.6945, "lr": 5e-06, "epoch": 2.5373134328358207, "percentage": 84.58, "elapsed_time": "13:51:17", "remaining_time": "2:31:35"}
|
88 |
+
{"current_steps": 860, "total_steps": 1005, "loss": 0.6983, "lr": 5e-06, "epoch": 2.5671641791044775, "percentage": 85.57, "elapsed_time": "14:00:53", "remaining_time": "2:21:46"}
|
89 |
+
{"current_steps": 870, "total_steps": 1005, "loss": 0.6986, "lr": 5e-06, "epoch": 2.5970149253731343, "percentage": 86.57, "elapsed_time": "14:10:31", "remaining_time": "2:11:58"}
|
90 |
+
{"current_steps": 880, "total_steps": 1005, "loss": 0.6992, "lr": 5e-06, "epoch": 2.626865671641791, "percentage": 87.56, "elapsed_time": "14:20:08", "remaining_time": "2:02:10"}
|
91 |
+
{"current_steps": 890, "total_steps": 1005, "loss": 0.697, "lr": 5e-06, "epoch": 2.656716417910448, "percentage": 88.56, "elapsed_time": "14:29:44", "remaining_time": "1:52:22"}
|
92 |
+
{"current_steps": 900, "total_steps": 1005, "loss": 0.697, "lr": 5e-06, "epoch": 2.6865671641791042, "percentage": 89.55, "elapsed_time": "14:39:21", "remaining_time": "1:42:35"}
|
93 |
+
{"current_steps": 910, "total_steps": 1005, "loss": 0.6926, "lr": 5e-06, "epoch": 2.716417910447761, "percentage": 90.55, "elapsed_time": "14:48:58", "remaining_time": "1:32:48"}
|
94 |
+
{"current_steps": 920, "total_steps": 1005, "loss": 0.6954, "lr": 5e-06, "epoch": 2.746268656716418, "percentage": 91.54, "elapsed_time": "14:58:32", "remaining_time": "1:23:01"}
|
95 |
+
{"current_steps": 930, "total_steps": 1005, "loss": 0.6992, "lr": 5e-06, "epoch": 2.7761194029850746, "percentage": 92.54, "elapsed_time": "15:08:08", "remaining_time": "1:13:14"}
|
96 |
+
{"current_steps": 940, "total_steps": 1005, "loss": 0.6946, "lr": 5e-06, "epoch": 2.8059701492537314, "percentage": 93.53, "elapsed_time": "15:17:44", "remaining_time": "1:03:27"}
|
97 |
+
{"current_steps": 950, "total_steps": 1005, "loss": 0.6954, "lr": 5e-06, "epoch": 2.835820895522388, "percentage": 94.53, "elapsed_time": "15:27:19", "remaining_time": "0:53:41"}
|
98 |
+
{"current_steps": 960, "total_steps": 1005, "loss": 0.6991, "lr": 5e-06, "epoch": 2.8656716417910446, "percentage": 95.52, "elapsed_time": "15:36:56", "remaining_time": "0:43:55"}
|
99 |
+
{"current_steps": 970, "total_steps": 1005, "loss": 0.6988, "lr": 5e-06, "epoch": 2.8955223880597014, "percentage": 96.52, "elapsed_time": "15:46:33", "remaining_time": "0:34:09"}
|
100 |
+
{"current_steps": 980, "total_steps": 1005, "loss": 0.6985, "lr": 5e-06, "epoch": 2.925373134328358, "percentage": 97.51, "elapsed_time": "15:56:09", "remaining_time": "0:24:23"}
|
101 |
+
{"current_steps": 990, "total_steps": 1005, "loss": 0.6957, "lr": 5e-06, "epoch": 2.955223880597015, "percentage": 98.51, "elapsed_time": "16:05:45", "remaining_time": "0:14:37"}
|
102 |
+
{"current_steps": 1000, "total_steps": 1005, "loss": 0.6979, "lr": 5e-06, "epoch": 2.9850746268656714, "percentage": 99.5, "elapsed_time": "16:15:22", "remaining_time": "0:04:52"}
|