Model save
Browse files- .gitattributes +1 -0
- all_results.json +3 -3
- eval_nbest_predictions.json +3 -0
- eval_predictions.json +0 -0
- model.safetensors +1 -1
- train_results.json +3 -3
- trainer_state.json +3 -3
- training_args.bin +1 -1
.gitattributes
CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
+
eval_nbest_predictions.json filter=lfs diff=lfs merge=lfs -text
|
all_results.json
CHANGED
@@ -2,8 +2,8 @@
|
|
2 |
"epoch": 2.0,
|
3 |
"total_flos": 1.1159654864928768e+16,
|
4 |
"train_loss": 1.1755467142439282,
|
5 |
-
"train_runtime":
|
6 |
"train_samples": 397452,
|
7 |
-
"train_samples_per_second": 93.
|
8 |
-
"train_steps_per_second": 7.
|
9 |
}
|
|
|
2 |
"epoch": 2.0,
|
3 |
"total_flos": 1.1159654864928768e+16,
|
4 |
"train_loss": 1.1755467142439282,
|
5 |
+
"train_runtime": 8474.7112,
|
6 |
"train_samples": 397452,
|
7 |
+
"train_samples_per_second": 93.797,
|
8 |
+
"train_steps_per_second": 7.816
|
9 |
}
|
eval_nbest_predictions.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:43df2980f28317698aa7d359fba8cfe5d0fa0bd2cf6fbe326ea72712d5de9945
|
3 |
+
size 58166149
|
eval_predictions.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 55116544
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5bc0080772daa24c2c0813317ba1bbeb1ce5ead68d5fa69b4fce7dbb72b63124
|
3 |
size 55116544
|
train_results.json
CHANGED
@@ -2,8 +2,8 @@
|
|
2 |
"epoch": 2.0,
|
3 |
"total_flos": 1.1159654864928768e+16,
|
4 |
"train_loss": 1.1755467142439282,
|
5 |
-
"train_runtime":
|
6 |
"train_samples": 397452,
|
7 |
-
"train_samples_per_second": 93.
|
8 |
-
"train_steps_per_second": 7.
|
9 |
}
|
|
|
2 |
"epoch": 2.0,
|
3 |
"total_flos": 1.1159654864928768e+16,
|
4 |
"train_loss": 1.1755467142439282,
|
5 |
+
"train_runtime": 8474.7112,
|
6 |
"train_samples": 397452,
|
7 |
+
"train_samples_per_second": 93.797,
|
8 |
+
"train_steps_per_second": 7.816
|
9 |
}
|
trainer_state.json
CHANGED
@@ -938,9 +938,9 @@
|
|
938 |
"step": 66242,
|
939 |
"total_flos": 1.1159654864928768e+16,
|
940 |
"train_loss": 1.1755467142439282,
|
941 |
-
"train_runtime":
|
942 |
-
"train_samples_per_second": 93.
|
943 |
-
"train_steps_per_second": 7.
|
944 |
}
|
945 |
],
|
946 |
"logging_steps": 500,
|
|
|
938 |
"step": 66242,
|
939 |
"total_flos": 1.1159654864928768e+16,
|
940 |
"train_loss": 1.1755467142439282,
|
941 |
+
"train_runtime": 8474.7112,
|
942 |
+
"train_samples_per_second": 93.797,
|
943 |
+
"train_steps_per_second": 7.816
|
944 |
}
|
945 |
],
|
946 |
"logging_steps": 500,
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5841
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0a4d6e0968cd9abe3be1e33382614c9d48f9f2c41ca39ab0fa6865c4a161882d
|
3 |
size 5841
|