training completed[dev]: 512 128

Browse files

Files changed (5) hide show

README.md +22 -21
all_results.json +10 -10
model.safetensors +1 -1
runs/Mar31_15-48-53_053f5f175b48/events.out.tfevents.1711900137.053f5f175b48.166.0 +2 -2
test_results.json +10 -10

README.md CHANGED Viewed

@@ -18,13 +18,13 @@ should probably proofread and complete it, then remove this comment. -->
 This model is a fine-tuned version of [t5-base](https://huggingface.co/t5-base) on an unknown dataset.
 It achieves the following results on the evaluation set:
-- Loss: 1.1670
-- Rouge1: 0.6791
-- Rouge2: 0.4136
-- Rougel: 0.6183
-- Rougelsum: 0.6185
-- Wer: 0.4846
-- Bleurt: 0.3314
 ## Model description
@@ -56,20 +56,21 @@ The following hyperparameters were used during training:
 | Training Loss | Epoch | Step | Validation Loss | Rouge1 | Rouge2 | Rougel | Rougelsum | Wer    | Bleurt |
 |:-------------:|:-----:|:----:|:---------------:|:------:|:------:|:------:|:---------:|:------:|:------:|
-| No log        | 0.14  | 250  | 1.3197          | 0.6548 | 0.3804 | 0.5904 | 0.5905    | 0.5188 | 0.3009 |
-| 1.7026        | 0.27  | 500  | 1.2676          | 0.6613 | 0.3904 | 0.5985 | 0.5987    | 0.5074 | 0.3009 |
-| 1.7026        | 0.41  | 750  | 1.2385          | 0.6664 | 0.3961 | 0.6043 | 0.6044    | 0.5023 | 0.3009 |
-| 1.3446        | 0.55  | 1000 | 1.2234          | 0.6691 | 0.4009 | 0.6075 | 0.6076    | 0.4972 | 0.3009 |
-| 1.3446        | 0.68  | 1250 | 1.2089          | 0.671  | 0.4031 | 0.6099 | 0.6101    | 0.4944 | 0.3009 |
-| 1.309         | 0.82  | 1500 | 1.1983          | 0.673  | 0.4064 | 0.6121 | 0.6123    | 0.4914 | 0.3009 |
-| 1.309         | 0.96  | 1750 | 1.1900          | 0.6744 | 0.4075 | 0.6136 | 0.6137    | 0.4897 | 0.3009 |
-| 1.2783        | 1.09  | 2000 | 1.1840          | 0.6744 | 0.4082 | 0.614  | 0.6141    | 0.4889 | 0.2798 |
-| 1.2783        | 1.23  | 2250 | 1.1808          | 0.6759 | 0.4102 | 0.6154 | 0.6156    | 0.4875 | 0.2944 |
-| 1.2683        | 1.36  | 2500 | 1.1763          | 0.6771 | 0.4111 | 0.6163 | 0.6165    | 0.4863 | 0.3153 |
-| 1.2683        | 1.5   | 2750 | 1.1720          | 0.6772 | 0.4115 | 0.6169 | 0.617     | 0.4859 | 0.4109 |
-| 1.2469        | 1.64  | 3000 | 1.1701          | 0.6783 | 0.4127 | 0.6176 | 0.6178    | 0.485  | 0.3314 |
-| 1.2469        | 1.77  | 3250 | 1.1680          | 0.6786 | 0.4131 | 0.6178 | 0.6179    | 0.4849 | 0.3314 |
-| 1.2171        | 1.91  | 3500 | 1.1670          | 0.6791 | 0.4136 | 0.6183 | 0.6185    | 0.4846 | 0.3314 |
 ### Framework versions

 This model is a fine-tuned version of [t5-base](https://huggingface.co/t5-base) on an unknown dataset.
 It achieves the following results on the evaluation set:
+- Loss: 1.1785
+- Rouge1: 0.6772
+- Rouge2: 0.4105
+- Rougel: 0.6161
+- Rougelsum: 0.6161
+- Wer: 0.4869
+- Bleurt: 0.3779
 ## Model description
 | Training Loss | Epoch | Step | Validation Loss | Rouge1 | Rouge2 | Rougel | Rougelsum | Wer    | Bleurt |
 |:-------------:|:-----:|:----:|:---------------:|:------:|:------:|:------:|:---------:|:------:|:------:|
+| No log        | 0.13  | 250  | 1.3316          | 0.6509 | 0.3768 | 0.5866 | 0.5865    | 0.5217 | 0.3009 |
+| 1.7919        | 0.27  | 500  | 1.2776          | 0.6593 | 0.3865 | 0.5962 | 0.5962    | 0.5108 | 0.3009 |
+| 1.7919        | 0.4   | 750  | 1.2513          | 0.6633 | 0.3931 | 0.6015 | 0.6014    | 0.5039 | 0.3009 |
+| 1.3552        | 0.53  | 1000 | 1.2326          | 0.6667 | 0.3967 | 0.6048 | 0.6047    | 0.5008 | 0.3009 |
+| 1.3552        | 0.66  | 1250 | 1.2236          | 0.669  | 0.4    | 0.6072 | 0.6072    | 0.4972 | 0.3314 |
+| 1.3074        | 0.8   | 1500 | 1.2118          | 0.6711 | 0.4022 | 0.6093 | 0.6093    | 0.4953 | 0.3314 |
+| 1.3074        | 0.93  | 1750 | 1.2022          | 0.6714 | 0.4034 | 0.6105 | 0.6104    | 0.4932 | 0.2798 |
+| 1.3037        | 1.06  | 2000 | 1.1972          | 0.673  | 0.4053 | 0.6117 | 0.6116    | 0.4916 | 0.3771 |
+| 1.3037        | 1.2   | 2250 | 1.1909          | 0.6749 | 0.4068 | 0.6136 | 0.6135    | 0.4905 | 0.3314 |
+| 1.2676        | 1.33  | 2500 | 1.1889          | 0.676  | 0.4086 | 0.6143 | 0.6143    | 0.4893 | 0.3314 |
+| 1.2676        | 1.46  | 2750 | 1.1848          | 0.6763 | 0.4091 | 0.615  | 0.6149    | 0.4884 | 0.3314 |
+| 1.2796        | 1.6   | 3000 | 1.1829          | 0.677  | 0.4095 | 0.6154 | 0.6154    | 0.488  | 0.3123 |
+| 1.2796        | 1.73  | 3250 | 1.1808          | 0.6767 | 0.41   | 0.6157 | 0.6157    | 0.4876 | 0.3779 |
+| 1.2489        | 1.86  | 3500 | 1.1787          | 0.6771 | 0.4105 | 0.616  | 0.616     | 0.4869 | 0.3771 |
+| 1.2489        | 1.99  | 3750 | 1.1785          | 0.6772 | 0.4105 | 0.6161 | 0.6161    | 0.4869 | 0.3779 |
 ### Framework versions

all_results.json CHANGED Viewed

@@ -1,12 +1,12 @@
 {
-    "test_BLEURT": -0.2487,
-    "test_WER": 0.4777,
-    "test_loss": 1.1913501024246216,
-    "test_rouge1": 0.6851,
-    "test_rouge2": 0.4239,
-    "test_rougeL": 0.6255,
-    "test_rougeLsum": 0.6251,
-    "test_runtime": 47.9856,
-    "test_samples_per_second": 7.648,
-    "test_steps_per_second": 1.292
 }

 {
+    "test_BLEURT": -0.9706,
+    "test_WER": 0.4816,
+    "test_loss": 1.195426344871521,
+    "test_rouge1": 0.6827,
+    "test_rouge2": 0.4184,
+    "test_rougeL": 0.6228,
+    "test_rougeLsum": 0.6222,
+    "test_runtime": 31.0979,
+    "test_samples_per_second": 12.123,
+    "test_steps_per_second": 2.026
 }

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ef53db75fbd2803ab867085b85fad40af51c1f686667f9acbf045005d951f1e4
 size 891644712

 version https://git-lfs.github.com/spec/v1
+oid sha256:0b9613afbb9d6a6140659f4336ce375e04d821d1506dcda5db5e31ff0cf1c38a
 size 891644712

runs/Mar31_15-48-53_053f5f175b48/events.out.tfevents.1711900137.053f5f175b48.166.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d1173f01f2dc35a167659a6be47134b46c6da675448bb23205c33e911aff38a8
-size 10983

 version https://git-lfs.github.com/spec/v1
+oid sha256:263252bfd89a1284835ab1bc74cb6ee3548261c4494ade5f8a36a236215da838
+size 15967

test_results.json CHANGED Viewed

@@ -1,12 +1,12 @@
 {
-    "test_BLEURT": -0.2487,
-    "test_WER": 0.4777,
-    "test_loss": 1.1913501024246216,
-    "test_rouge1": 0.6851,
-    "test_rouge2": 0.4239,
-    "test_rougeL": 0.6255,
-    "test_rougeLsum": 0.6251,
-    "test_runtime": 47.9856,
-    "test_samples_per_second": 7.648,
-    "test_steps_per_second": 1.292
 }

 {
+    "test_BLEURT": -0.9706,
+    "test_WER": 0.4816,
+    "test_loss": 1.195426344871521,
+    "test_rouge1": 0.6827,
+    "test_rouge2": 0.4184,
+    "test_rougeL": 0.6228,
+    "test_rougeLsum": 0.6222,
+    "test_runtime": 31.0979,
+    "test_samples_per_second": 12.123,
+    "test_steps_per_second": 2.026
 }