anz2 committed on
Commit
5b32cc2
·
1 Parent(s): beac683

update features for evaluation

Browse files
Files changed (1) hide show
  1. iliauniiccocrevaluation.py +96 -38
iliauniiccocrevaluation.py CHANGED
@@ -71,48 +71,106 @@ class IliauniIccOCREvaluation(evaluate.Metric):
71
  # This defines the format of each prediction and reference
72
  features=datasets.Features(
73
  {
74
- "id": datasets.Value("string"),
75
- "filepath": datasets.Value("string"),
76
- "tags": datasets.Sequence(datasets.Value("string")),
77
- "metadata": datasets.Features(
78
- {
79
- "size_bytes": datasets.Value("int32"),
80
- "mime_type": datasets.Value("string"),
81
- "width": datasets.Value("int32"),
82
- "height": datasets.Value("int32"),
83
- "num_channels": datasets.Value("int32"),
84
- "author": datasets.Value("string"),
85
- "category": datasets.Value("string"),
86
- "document_name": datasets.Value("string"),
87
- "source": datasets.Value("string"),
88
- "year": datasets.Value("int32")
89
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
90
  ),
91
- "_media_type": datasets.Value("string"),
92
- "_rand": datasets.Value("string"),
93
- "detections": datasets.Features(
94
- {
95
- "detections": datasets.Sequence(
96
- datasets.Features(
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
97
  {
98
- "id": datasets.Value("string"),
99
- "attributes": datasets.Sequence(datasets.Value("string")),
100
- "tags": datasets.Value("string"),
101
- "label": datasets.Value("string"),
102
- "bounding_box": datasets.Sequence(datasets.Value("float32")),
103
- "confidence": datasets.Value("float32"),
104
- "index": datasets.Value("int32"),
105
- "page": datasets.Value("int32"),
106
- "block": datasets.Value("int32"),
107
- "paragraph": datasets.Value("int32"),
108
- "word": datasets.Value("int32"),
109
- "text": datasets.Value("string"),
 
 
 
 
 
 
110
  }
111
- )
112
- )
113
- }
 
 
 
114
  ),
115
- "image": datasets.Image(),
116
  }
117
  ),
118
  # Homepage of the module for documentation
 
71
  # This defines the format of each prediction and reference
72
  features=datasets.Features(
73
  {
74
+ "predictions": datasets.Sequence(
75
+ feature=datasets.Features(
76
+ {
77
+ "id": datasets.Value("string"),
78
+ "filepath": datasets.Value("string"),
79
+ "tags": datasets.Sequence(datasets.Value("string")),
80
+ "metadata": datasets.Features(
81
+ {
82
+ "size_bytes": datasets.Value("int32"),
83
+ "mime_type": datasets.Value("string"),
84
+ "width": datasets.Value("int32"),
85
+ "height": datasets.Value("int32"),
86
+ "num_channels": datasets.Value("int32"),
87
+ "author": datasets.Value("string"),
88
+ "category": datasets.Value("string"),
89
+ "document_name": datasets.Value("string"),
90
+ "source": datasets.Value("string"),
91
+ "year": datasets.Value("int32")
92
+ }
93
+ ),
94
+ "_media_type": datasets.Value("string"),
95
+ "_rand": datasets.Value("string"),
96
+ "detections": datasets.Features(
97
+ {
98
+ "detections": datasets.Sequence(
99
+ datasets.Features(
100
+ {
101
+ "id": datasets.Value("string"),
102
+ "attributes": datasets.Sequence(datasets.Value("string")),
103
+ "tags": datasets.Value("string"),
104
+ "label": datasets.Value("string"),
105
+ "bounding_box": datasets.Sequence(datasets.Value("float32")),
106
+ "confidence": datasets.Value("float32"),
107
+ "index": datasets.Value("int32"),
108
+ "page": datasets.Value("int32"),
109
+ "block": datasets.Value("int32"),
110
+ "paragraph": datasets.Value("int32"),
111
+ "word": datasets.Value("int32"),
112
+ "text": datasets.Value("string"),
113
+ }
114
+ )
115
+ )
116
+ }
117
+ ),
118
+ "image": datasets.Image()
119
+ }
120
+ ),
121
+ length=-1,
122
+ id=None
123
  ),
124
+ "references": datasets.Sequence(
125
+ feature=datasets.Features(
126
+ {
127
+ "id": datasets.Value("string"),
128
+ "filepath": datasets.Value("string"),
129
+ "tags": datasets.Sequence(datasets.Value("string")),
130
+ "metadata": datasets.Features(
131
+ {
132
+ "size_bytes": datasets.Value("int32"),
133
+ "mime_type": datasets.Value("string"),
134
+ "width": datasets.Value("int32"),
135
+ "height": datasets.Value("int32"),
136
+ "num_channels": datasets.Value("int32"),
137
+ "author": datasets.Value("string"),
138
+ "category": datasets.Value("string"),
139
+ "document_name": datasets.Value("string"),
140
+ "source": datasets.Value("string"),
141
+ "year": datasets.Value("int32")
142
+ }
143
+ ),
144
+ "_media_type": datasets.Value("string"),
145
+ "_rand": datasets.Value("string"),
146
+ "detections": datasets.Features(
147
  {
148
+ "detections": datasets.Sequence(
149
+ datasets.Features(
150
+ {
151
+ "id": datasets.Value("string"),
152
+ "attributes": datasets.Sequence(datasets.Value("string")),
153
+ "tags": datasets.Value("string"),
154
+ "label": datasets.Value("string"),
155
+ "bounding_box": datasets.Sequence(datasets.Value("float32")),
156
+ "confidence": datasets.Value("float32"),
157
+ "index": datasets.Value("int32"),
158
+ "page": datasets.Value("int32"),
159
+ "block": datasets.Value("int32"),
160
+ "paragraph": datasets.Value("int32"),
161
+ "word": datasets.Value("int32"),
162
+ "text": datasets.Value("string"),
163
+ }
164
+ )
165
+ )
166
  }
167
+ ),
168
+ "image": datasets.Image()
169
+ }
170
+ ),
171
+ length=-1,
172
+ id=None
173
  ),
 
174
  }
175
  ),
176
  # Homepage of the module for documentation