Commit
·
26cfee0
1
Parent(s):
1fc288f
Training in progress epoch 0
Browse files
- README.md +6 -65
- config.json +1 -1
- generation_config.json +1 -1
- tf_model.h5 +1 -1
README.md
CHANGED
@@ -16,9 +16,9 @@ probably proofread and complete it, then remove this comment. -->
|
|
16 |
|
17 |
This model is a fine-tuned version of [t5-small](https://huggingface.co/t5-small) on an unknown dataset.
|
18 |
It achieves the following results on the evaluation set:
|
19 |
-
- Train Loss: 0.3661
|
20 |
-
- Validation Loss: 0.2821
|
21 |
-
- Epoch: 59
|
22 |
|
23 |
## Model description
|
24 |
|
@@ -44,71 +44,12 @@ The following hyperparameters were used during training:
|
|
44 |
|
45 |
| Train Loss | Validation Loss | Epoch |
|
46 |
|:----------:|:---------------:|:-----:|
|
47 |
-
| 4.
|
48 |
-
| 3.8859 | 3.0872 | 1 |
|
49 |
-
| 3.3048 | 2.5089 | 2 |
|
50 |
-
| 2.8571 | 2.1127 | 3 |
|
51 |
-
| 2.5441 | 1.8550 | 4 |
|
52 |
-
| 2.2831 | 1.6366 | 5 |
|
53 |
-
| 2.0725 | 1.4511 | 6 |
|
54 |
-
| 1.8948 | 1.2961 | 7 |
|
55 |
-
| 1.7461 | 1.1526 | 8 |
|
56 |
-
| 1.6041 | 1.0388 | 9 |
|
57 |
-
| 1.4667 | 0.9410 | 10 |
|
58 |
-
| 1.3698 | 0.8480 | 11 |
|
59 |
-
| 1.2537 | 0.7736 | 12 |
|
60 |
-
| 1.1784 | 0.6984 | 13 |
|
61 |
-
| 1.0971 | 0.6493 | 14 |
|
62 |
-
| 1.0204 | 0.5986 | 15 |
|
63 |
-
| 0.9592 | 0.5656 | 16 |
|
64 |
-
| 0.9040 | 0.5292 | 17 |
|
65 |
-
| 0.8568 | 0.5048 | 18 |
|
66 |
-
| 0.8097 | 0.4807 | 19 |
|
67 |
-
| 0.7699 | 0.4611 | 20 |
|
68 |
-
| 0.7361 | 0.4458 | 21 |
|
69 |
-
| 0.7109 | 0.4304 | 22 |
|
70 |
-
| 0.6740 | 0.4174 | 23 |
|
71 |
-
| 0.6603 | 0.4037 | 24 |
|
72 |
-
| 0.6272 | 0.3936 | 25 |
|
73 |
-
| 0.5996 | 0.3834 | 26 |
|
74 |
-
| 0.5899 | 0.3714 | 27 |
|
75 |
-
| 0.5650 | 0.3660 | 28 |
|
76 |
-
| 0.5594 | 0.3587 | 29 |
|
77 |
-
| 0.5349 | 0.3524 | 30 |
|
78 |
-
| 0.5199 | 0.3477 | 31 |
|
79 |
-
| 0.5176 | 0.3410 | 32 |
|
80 |
-
| 0.5016 | 0.3335 | 33 |
|
81 |
-
| 0.4984 | 0.3287 | 34 |
|
82 |
-
| 0.4807 | 0.3284 | 35 |
|
83 |
-
| 0.4772 | 0.3212 | 36 |
|
84 |
-
| 0.4633 | 0.3227 | 37 |
|
85 |
-
| 0.4606 | 0.3169 | 38 |
|
86 |
-
| 0.4466 | 0.3135 | 39 |
|
87 |
-
| 0.4366 | 0.3097 | 40 |
|
88 |
-
| 0.4307 | 0.3053 | 41 |
|
89 |
-
| 0.4264 | 0.3050 | 42 |
|
90 |
-
| 0.4263 | 0.3041 | 43 |
|
91 |
-
| 0.4171 | 0.3056 | 44 |
|
92 |
-
| 0.4124 | 0.2984 | 45 |
|
93 |
-
| 0.4066 | 0.3014 | 46 |
|
94 |
-
| 0.4050 | 0.2977 | 47 |
|
95 |
-
| 0.4014 | 0.2924 | 48 |
|
96 |
-
| 0.3939 | 0.2905 | 49 |
|
97 |
-
| 0.3951 | 0.2899 | 50 |
|
98 |
-
| 0.3886 | 0.2910 | 51 |
|
99 |
-
| 0.3878 | 0.2924 | 52 |
|
100 |
-
| 0.3835 | 0.2863 | 53 |
|
101 |
-
| 0.3766 | 0.2866 | 54 |
|
102 |
-
| 0.3777 | 0.2828 | 55 |
|
103 |
-
| 0.3688 | 0.2825 | 56 |
|
104 |
-
| 0.3665 | 0.2831 | 57 |
|
105 |
-
| 0.3717 | 0.2805 | 58 |
|
106 |
-
| 0.3661 | 0.2821 | 59 |
|
107 |
|
108 |
|
109 |
### Framework versions
|
110 |
|
111 |
-
- Transformers 4.
|
112 |
- TensorFlow 2.17.0
|
113 |
- Datasets 3.1.0
|
114 |
-
- Tokenizers 0.
|
|
|
16 |
|
17 |
This model is a fine-tuned version of [t5-small](https://huggingface.co/t5-small) on an unknown dataset.
|
18 |
It achieves the following results on the evaluation set:
|
19 |
+
- Train Loss: 4.7278
|
20 |
+
- Validation Loss: 3.8741
|
21 |
+
- Epoch: 0
|
22 |
|
23 |
## Model description
|
24 |
|
|
|
44 |
|
45 |
| Train Loss | Validation Loss | Epoch |
|
46 |
|:----------:|:---------------:|:-----:|
|
47 |
+
| 4.7278 | 3.8741 | 0 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
48 |
|
49 |
|
50 |
### Framework versions
|
51 |
|
52 |
+
- Transformers 4.46.1
|
53 |
- TensorFlow 2.17.0
|
54 |
- Datasets 3.1.0
|
55 |
+
- Tokenizers 0.20.2
|
config.json
CHANGED
@@ -54,7 +54,7 @@
|
|
54 |
"prefix": "translate English to Romanian: "
|
55 |
}
|
56 |
},
|
57 |
-
"transformers_version": "4.
|
58 |
"use_cache": true,
|
59 |
"vocab_size": 32128
|
60 |
}
|
|
|
54 |
"prefix": "translate English to Romanian: "
|
55 |
}
|
56 |
},
|
57 |
+
"transformers_version": "4.46.1",
|
58 |
"use_cache": true,
|
59 |
"vocab_size": 32128
|
60 |
}
|
generation_config.json
CHANGED
@@ -3,5 +3,5 @@
|
|
3 |
"decoder_start_token_id": 0,
|
4 |
"eos_token_id": 1,
|
5 |
"pad_token_id": 0,
|
6 |
-
"transformers_version": "4.
|
7 |
}
|
|
|
3 |
"decoder_start_token_id": 0,
|
4 |
"eos_token_id": 1,
|
5 |
"pad_token_id": 0,
|
6 |
+
"transformers_version": "4.46.1"
|
7 |
}
|
tf_model.h5
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 373902664
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2f622344f75cfd1101c0a5676b2ae70ea031bbc06276a5e50483fd3cf00fe1e5
|
3 |
size 373902664
|