jonathanagustin
committed on
Commit
•
4548d44
1
Parent(s):
a9eb5ca
Training in progress, step 1100
Browse files
- pytorch_model.bin +1 -1
- tokenizer.json +3 -5
- trainer_state.json +6 -6
- training_args.bin +1 -1
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 265493026
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f6adc9954515c2a6c8270a1f55a43bdcd35c3c879a458287434024777b2c6983
|
3 |
size 265493026
|
tokenizer.json
CHANGED
@@ -3,13 +3,11 @@
|
|
3 |
"truncation": {
|
4 |
"direction": "Right",
|
5 |
"max_length": 512,
|
6 |
-
"strategy": "
|
7 |
-
"stride":
|
8 |
},
|
9 |
"padding": {
|
10 |
-
"strategy":
|
11 |
-
"Fixed": 512
|
12 |
-
},
|
13 |
"direction": "Right",
|
14 |
"pad_to_multiple_of": null,
|
15 |
"pad_id": 0,
|
|
|
3 |
"truncation": {
|
4 |
"direction": "Right",
|
5 |
"max_length": 512,
|
6 |
+
"strategy": "OnlySecond",
|
7 |
+
"stride": 128
|
8 |
},
|
9 |
"padding": {
|
10 |
+
"strategy": "BatchLongest",
|
|
|
|
|
11 |
"direction": "Right",
|
12 |
"pad_to_multiple_of": null,
|
13 |
"pad_id": 0,
|
trainer_state.json
CHANGED
@@ -153,16 +153,16 @@
|
|
153 |
"step": 1020,
|
154 |
"total_flos": 5.148633647651021e+16,
|
155 |
"train_loss": 0.028946983113008386,
|
156 |
-
"train_runtime": 26.
|
157 |
-
"train_samples_per_second":
|
158 |
-
"train_steps_per_second": 38.
|
159 |
},
|
160 |
{
|
161 |
"epoch": 4.0,
|
162 |
"eval_loss": 1.3930128812789917,
|
163 |
-
"eval_runtime": 8.
|
164 |
-
"eval_samples_per_second":
|
165 |
-
"eval_steps_per_second": 11.
|
166 |
"step": 1020
|
167 |
}
|
168 |
],
|
|
|
153 |
"step": 1020,
|
154 |
"total_flos": 5.148633647651021e+16,
|
155 |
"train_loss": 0.028946983113008386,
|
156 |
+
"train_runtime": 26.7355,
|
157 |
+
"train_samples_per_second": 19525.044,
|
158 |
+
"train_steps_per_second": 38.152
|
159 |
},
|
160 |
{
|
161 |
"epoch": 4.0,
|
162 |
"eval_loss": 1.3930128812789917,
|
163 |
+
"eval_runtime": 8.3016,
|
164 |
+
"eval_samples_per_second": 1441.77,
|
165 |
+
"eval_steps_per_second": 11.323,
|
166 |
"step": 1020
|
167 |
}
|
168 |
],
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4664
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3345a9daf4130375c7a09b812dbb5af19f7b2a07a23d3827bb495e8766983668
|
3 |
size 4664
|