Training in progress, epoch 1
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4976698672
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b347e7656cb3329f1dc5e252d10969d8d91dfd1b39d67fa706d556dfef2ea944
|
3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4999802720
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8441a81ae53f602927f7cc608cf5b60828ff51f0385a143c17f83e7ea3067376
|
3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4915916176
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:143536cdbd9e21bf79fd7363820d31539be7987f0cd3e89115bd517327646db8
|
3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1168138808
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1c5808ddd16216fde11bb479bb5862fc7182bf6b4e6da37e968d6a28a23832e8
|
3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
@@ -10,3 +10,15 @@
|
|
10 |
{"current_steps": 100, "total_steps": 330, "loss": 0.594, "learning_rate": 5e-06, "epoch": 0.903954802259887, "percentage": 30.3, "elapsed_time": "0:51:30", "remaining_time": "1:58:28"}
|
11 |
{"current_steps": 110, "total_steps": 330, "loss": 0.5971, "learning_rate": 5e-06, "epoch": 0.9943502824858758, "percentage": 33.33, "elapsed_time": "0:56:38", "remaining_time": "1:53:17"}
|
12 |
{"current_steps": 110, "total_steps": 330, "eval_loss": 0.593043327331543, "epoch": 0.9943502824858758, "percentage": 33.33, "elapsed_time": "0:58:13", "remaining_time": "1:56:27"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
10 |
{"current_steps": 100, "total_steps": 330, "loss": 0.594, "learning_rate": 5e-06, "epoch": 0.903954802259887, "percentage": 30.3, "elapsed_time": "0:51:30", "remaining_time": "1:58:28"}
|
11 |
{"current_steps": 110, "total_steps": 330, "loss": 0.5971, "learning_rate": 5e-06, "epoch": 0.9943502824858758, "percentage": 33.33, "elapsed_time": "0:56:38", "remaining_time": "1:53:17"}
|
12 |
{"current_steps": 110, "total_steps": 330, "eval_loss": 0.593043327331543, "epoch": 0.9943502824858758, "percentage": 33.33, "elapsed_time": "0:58:13", "remaining_time": "1:56:27"}
|
13 |
+
{"current_steps": 120, "total_steps": 330, "loss": 0.5786, "learning_rate": 5e-06, "epoch": 1.0847457627118644, "percentage": 36.36, "elapsed_time": "1:04:15", "remaining_time": "1:52:26"}
|
14 |
+
{"current_steps": 130, "total_steps": 330, "loss": 0.5597, "learning_rate": 5e-06, "epoch": 1.1751412429378532, "percentage": 39.39, "elapsed_time": "1:09:22", "remaining_time": "1:46:44"}
|
15 |
+
{"current_steps": 140, "total_steps": 330, "loss": 0.556, "learning_rate": 5e-06, "epoch": 1.2655367231638417, "percentage": 42.42, "elapsed_time": "1:14:30", "remaining_time": "1:41:07"}
|
16 |
+
{"current_steps": 150, "total_steps": 330, "loss": 0.5637, "learning_rate": 5e-06, "epoch": 1.3559322033898304, "percentage": 45.45, "elapsed_time": "1:19:38", "remaining_time": "1:35:34"}
|
17 |
+
{"current_steps": 160, "total_steps": 330, "loss": 0.5552, "learning_rate": 5e-06, "epoch": 1.4463276836158192, "percentage": 48.48, "elapsed_time": "1:24:45", "remaining_time": "1:30:02"}
|
18 |
+
{"current_steps": 170, "total_steps": 330, "loss": 0.557, "learning_rate": 5e-06, "epoch": 1.536723163841808, "percentage": 51.52, "elapsed_time": "1:29:52", "remaining_time": "1:24:35"}
|
19 |
+
{"current_steps": 180, "total_steps": 330, "loss": 0.5561, "learning_rate": 5e-06, "epoch": 1.6271186440677967, "percentage": 54.55, "elapsed_time": "1:35:01", "remaining_time": "1:19:10"}
|
20 |
+
{"current_steps": 190, "total_steps": 330, "loss": 0.5583, "learning_rate": 5e-06, "epoch": 1.7175141242937855, "percentage": 57.58, "elapsed_time": "1:40:09", "remaining_time": "1:13:48"}
|
21 |
+
{"current_steps": 200, "total_steps": 330, "loss": 0.5572, "learning_rate": 5e-06, "epoch": 1.807909604519774, "percentage": 60.61, "elapsed_time": "1:45:19", "remaining_time": "1:08:27"}
|
22 |
+
{"current_steps": 210, "total_steps": 330, "loss": 0.5549, "learning_rate": 5e-06, "epoch": 1.8983050847457628, "percentage": 63.64, "elapsed_time": "1:50:29", "remaining_time": "1:03:08"}
|
23 |
+
{"current_steps": 220, "total_steps": 330, "loss": 0.5574, "learning_rate": 5e-06, "epoch": 1.9887005649717513, "percentage": 66.67, "elapsed_time": "1:55:38", "remaining_time": "0:57:49"}
|
24 |
+
{"current_steps": 221, "total_steps": 330, "eval_loss": 0.580794095993042, "epoch": 1.9977401129943502, "percentage": 66.97, "elapsed_time": "1:57:27", "remaining_time": "0:57:55"}
|