Commit
·
8567f52
1
Parent(s):
2e7a892
End of training
Browse files
README.md
CHANGED
@@ -13,10 +13,10 @@ should probably proofread and complete it, then remove this comment. -->
|
|
13 |
|
14 |
This model was trained from scratch on an unknown dataset.
|
15 |
It achieves the following results on the evaluation set:
|
16 |
-
- eval_loss: 4.
|
17 |
-
- eval_runtime: 0.
|
18 |
-
- eval_samples_per_second:
|
19 |
-
- eval_steps_per_second:
|
20 |
- epoch: 1.0
|
21 |
- step: 1
|
22 |
|
@@ -44,6 +44,7 @@ The following hyperparameters were used during training:
|
|
44 |
- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
|
45 |
- lr_scheduler_type: linear
|
46 |
- num_epochs: 50
|
|
|
47 |
|
48 |
### Framework versions
|
49 |
|
|
|
13 |
|
14 |
This model was trained from scratch on an unknown dataset.
|
15 |
It achieves the following results on the evaluation set:
|
16 |
+
- eval_loss: 4.4161
|
17 |
+
- eval_runtime: 0.0471
|
18 |
+
- eval_samples_per_second: 42.424
|
19 |
+
- eval_steps_per_second: 21.212
|
20 |
- epoch: 1.0
|
21 |
- step: 1
|
22 |
|
|
|
44 |
- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
|
45 |
- lr_scheduler_type: linear
|
46 |
- num_epochs: 50
|
47 |
+
- mixed_precision_training: Native AMP
|
48 |
|
49 |
### Framework versions
|
50 |
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 435820636
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:57c96db9d72fa11361de659173136028f7c98934637d89b5f50a34f0c4d7a41e
|
3 |
size 435820636
|
runs/Jan05_08-13-40_414819e23027/events.out.tfevents.1704442424.414819e23027.9579.18
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3d5157e976a6c0bdfd0a3264cdbbda96d2b8287516e29c3ea1dfa6732ed71e2c
|
3 |
+
size 8267
|
runs/Jan05_08-15-17_414819e23027/events.out.tfevents.1704442521.414819e23027.9579.19
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ef06bc349a69160ba31249b711101a42ea1e9a342205f04cb0869354d3de3dac
|
3 |
+
size 7846
|
trainer_state.json
CHANGED
@@ -11,15 +11,15 @@
|
|
11 |
{
|
12 |
"epoch": 1.0,
|
13 |
"learning_rate": 4.9e-05,
|
14 |
-
"loss": 1.
|
15 |
"step": 1
|
16 |
},
|
17 |
{
|
18 |
"epoch": 1.0,
|
19 |
-
"eval_loss": 4.
|
20 |
-
"eval_runtime": 0.
|
21 |
-
"eval_samples_per_second":
|
22 |
-
"eval_steps_per_second":
|
23 |
"step": 1
|
24 |
}
|
25 |
],
|
|
|
11 |
{
|
12 |
"epoch": 1.0,
|
13 |
"learning_rate": 4.9e-05,
|
14 |
+
"loss": 1.6172,
|
15 |
"step": 1
|
16 |
},
|
17 |
{
|
18 |
"epoch": 1.0,
|
19 |
+
"eval_loss": 4.416090965270996,
|
20 |
+
"eval_runtime": 0.0471,
|
21 |
+
"eval_samples_per_second": 42.424,
|
22 |
+
"eval_steps_per_second": 21.212,
|
23 |
"step": 1
|
24 |
}
|
25 |
],
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4600
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b966ffecbed91c5a0f2c413b6fea27a6d5dcd1ad5d43f2d92aea5836886021b2
|
3 |
size 4600
|