davelotito
committed on
End of training
Browse files
README.md
CHANGED
@@ -18,15 +18,15 @@ should probably proofread and complete it, then remove this comment. -->
|
|
18 |
|
19 |
This model is a fine-tuned version of [naver-clova-ix/donut-base](https://huggingface.co/naver-clova-ix/donut-base) on an unspecified dataset (no dataset name was recorded in the training metadata).
|
20 |
It achieves the following results on the evaluation set:
|
21 |
-
- Loss: 0.
|
22 |
-
- Bleu: 0.
|
23 |
-
- Precisions: [0.
|
24 |
-
- Brevity Penalty: 0.
|
25 |
-
- Length Ratio: 0.
|
26 |
-
- Translation Length:
|
27 |
-
- Reference Length:
|
28 |
-
- Cer: 0.
|
29 |
-
- Wer: 0.
|
30 |
|
31 |
## Model description
|
32 |
|
@@ -58,12 +58,12 @@ The following hyperparameters were used during training:
|
|
58 |
|
59 |
### Training results
|
60 |
|
61 |
-
| Training Loss | Epoch | Step | Validation Loss | Bleu | Precisions
|
62 |
-
|
63 |
-
|
|
64 |
-
| 1.
|
65 |
-
| 0.
|
66 |
-
| 0.
|
67 |
|
68 |
|
69 |
### Framework versions
|
|
|
18 |
|
19 |
This model is a fine-tuned version of [naver-clova-ix/donut-base](https://huggingface.co/naver-clova-ix/donut-base) on an unspecified dataset (no dataset name was recorded in the training metadata).
|
20 |
It achieves the following results on the evaluation set:
|
21 |
+
- Loss: 0.4919
|
22 |
+
- Bleu: 0.0652
|
23 |
+
- Precisions: [0.7938775510204081, 0.7020785219399538, 0.6462765957446809, 0.6050156739811913]
|
24 |
+
- Brevity Penalty: 0.0955
|
25 |
+
- Length Ratio: 0.2986
|
26 |
+
- Translation Length: 490
|
27 |
+
- Reference Length: 1641
|
28 |
+
- Cer: 0.7510
|
29 |
+
- Wer: 0.8349
|
30 |
|
31 |
## Model description
|
32 |
|
|
|
58 |
|
59 |
### Training results
|
60 |
|
61 |
+
| Training Loss | Epoch | Step | Validation Loss | Bleu | Precisions | Brevity Penalty | Length Ratio | Translation Length | Reference Length | Cer | Wer |
|
62 |
+
|:-------------:|:-----:|:----:|:---------------:|:------:|:--------------------------------------------------------------------------------:|:---------------:|:------------:|:------------------:|:----------------:|:------:|:------:|
|
63 |
+
| 4.0081 | 1.0 | 253 | 1.6452 | 0.0 | [0.4795539033457249, 0.14622641509433962, 0.03205128205128205, 0.0] | 0.0061 | 0.1639 | 269 | 1641 | 0.8712 | 0.9425 |
|
64 |
+
| 1.2573 | 2.0 | 506 | 0.6901 | 0.0379 | [0.6787234042553192, 0.5036319612590799, 0.4044943820224719, 0.3177257525083612] | 0.0828 | 0.2864 | 470 | 1641 | 0.7727 | 0.8821 |
|
65 |
+
| 0.9461 | 3.0 | 759 | 0.5654 | 0.0600 | [0.7469635627530364, 0.631578947368421, 0.5684210526315789, 0.5232198142414861] | 0.0981 | 0.3010 | 494 | 1641 | 0.7547 | 0.8479 |
|
66 |
+
| 0.669 | 4.0 | 1012 | 0.4919 | 0.0652 | [0.7938775510204081, 0.7020785219399538, 0.6462765957446809, 0.6050156739811913] | 0.0955 | 0.2986 | 490 | 1641 | 0.7510 | 0.8349 |
|
67 |
|
68 |
|
69 |
### Framework versions
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 809103512
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:104888ca0d41c70c59de232edcba580a9e5859acecf2e99ced6602b8d02f41ac
|
3 |
size 809103512
|
runs/May07_23-44-12_ip-172-16-110-63.ec2.internal/events.out.tfevents.1715125454.ip-172-16-110-63.ec2.internal.9395.0
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:42c6ca5ebcf7911bd35bfe280c452bb7d500e498802fec79a8cc08366f221cd0
|
3 |
+
size 14383
|
special_tokens_map.json
CHANGED
@@ -63,20 +63,6 @@
|
|
63 |
"rstrip": false,
|
64 |
"single_word": false
|
65 |
},
|
66 |
-
{
|
67 |
-
"content": "</s>",
|
68 |
-
"lstrip": false,
|
69 |
-
"normalized": false,
|
70 |
-
"rstrip": false,
|
71 |
-
"single_word": false
|
72 |
-
},
|
73 |
-
{
|
74 |
-
"content": "<s>",
|
75 |
-
"lstrip": false,
|
76 |
-
"normalized": false,
|
77 |
-
"rstrip": false,
|
78 |
-
"single_word": false
|
79 |
-
},
|
80 |
{
|
81 |
"content": "</s>",
|
82 |
"lstrip": false,
|
|
|
63 |
"rstrip": false,
|
64 |
"single_word": false
|
65 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
66 |
{
|
67 |
"content": "</s>",
|
68 |
"lstrip": false,
|
tokenizer_config.json
CHANGED
@@ -139,8 +139,6 @@
|
|
139 |
"<s_address>",
|
140 |
"</s_address>",
|
141 |
"<s>",
|
142 |
-
"</s>",
|
143 |
-
"<s>",
|
144 |
"</s>"
|
145 |
],
|
146 |
"bos_token": "<s>",
|
|
|
139 |
"<s_address>",
|
140 |
"</s_address>",
|
141 |
"<s>",
|
|
|
|
|
142 |
"</s>"
|
143 |
],
|
144 |
"bos_token": "<s>",
|