anz2 committed on
Commit
354cd04
·
1 Parent(s): 139bc02

update features for evaluation

Browse files
Files changed (1) hide show
  1. iliauniiccocrevaluation.py +97 -89
iliauniiccocrevaluation.py CHANGED
@@ -71,98 +71,106 @@ class IliauniIccOCREvaluation(evaluate.Metric):
71
  # This defines the format of each prediction and reference
72
  features=datasets.Features(
73
  {
74
- "predictions": datasets.Features(
75
- {
76
- "id": datasets.Value("string"),
77
- "filepath": datasets.Value("string"),
78
- "tags": datasets.Sequence(datasets.Value("string")),
79
- "metadata": datasets.Features(
80
- {
81
- "size_bytes": datasets.Value("int32"),
82
- "mime_type": datasets.Value("string"),
83
- "width": datasets.Value("int32"),
84
- "height": datasets.Value("int32"),
85
- "num_channels": datasets.Value("int32"),
86
- "author": datasets.Value("string"),
87
- "category": datasets.Value("string"),
88
- "document_name": datasets.Value("string"),
89
- "source": datasets.Value("string"),
90
- "year": datasets.Value("int32")
91
- }
92
- ),
93
- "_media_type": datasets.Value("string"),
94
- "_rand": datasets.Value("string"),
95
- "detections": datasets.Features(
96
- {
97
- "detections": datasets.Sequence(
98
- datasets.Features(
99
- {
100
- "id": datasets.Value("string"),
101
- "attributes": datasets.Sequence(datasets.Value("string")),
102
- "tags": datasets.Value("string"),
103
- "label": datasets.Value("string"),
104
- "bounding_box": datasets.Sequence(datasets.Value("float32")),
105
- "confidence": datasets.Value("float32"),
106
- "index": datasets.Value("int32"),
107
- "page": datasets.Value("int32"),
108
- "block": datasets.Value("int32"),
109
- "paragraph": datasets.Value("int32"),
110
- "word": datasets.Value("int32"),
111
- "text": datasets.Value("string"),
112
- }
 
 
113
  )
114
- )
115
- }
116
- ),
117
- "image": datasets.Image()
118
- }
 
 
119
  ),
120
- "references": datasets.Features(
121
- {
122
- "id": datasets.Value("string"),
123
- "filepath": datasets.Value("string"),
124
- "tags": datasets.Sequence(datasets.Value("string")),
125
- "metadata": datasets.Features(
126
- {
127
- "size_bytes": datasets.Value("int32"),
128
- "mime_type": datasets.Value("string"),
129
- "width": datasets.Value("int32"),
130
- "height": datasets.Value("int32"),
131
- "num_channels": datasets.Value("int32"),
132
- "author": datasets.Value("string"),
133
- "category": datasets.Value("string"),
134
- "document_name": datasets.Value("string"),
135
- "source": datasets.Value("string"),
136
- "year": datasets.Value("int32")
137
- }
138
- ),
139
- "_media_type": datasets.Value("string"),
140
- "_rand": datasets.Value("string"),
141
- "detections": datasets.Features(
142
- {
143
- "detections": datasets.Sequence(
144
- datasets.Features(
145
- {
146
- "id": datasets.Value("string"),
147
- "attributes": datasets.Sequence(datasets.Value("string")),
148
- "tags": datasets.Value("string"),
149
- "label": datasets.Value("string"),
150
- "bounding_box": datasets.Sequence(datasets.Value("float32")),
151
- "confidence": datasets.Value("float32"),
152
- "index": datasets.Value("int32"),
153
- "page": datasets.Value("int32"),
154
- "block": datasets.Value("int32"),
155
- "paragraph": datasets.Value("int32"),
156
- "word": datasets.Value("int32"),
157
- "text": datasets.Value("string"),
158
- }
 
 
159
  )
160
- )
161
- }
162
- ),
163
- "image": datasets.Image()
164
- }
165
- )
 
 
166
  }
167
  ),
168
  # Homepage of the module for documentation
 
71
  # This defines the format of each prediction and reference
72
  features=datasets.Features(
73
  {
74
+ "predictions": datasets.Sequence(
75
+ feature=datasets.Features(
76
+ {
77
+ "id": datasets.Value("string"),
78
+ "filepath": datasets.Value("string"),
79
+ "tags": datasets.Sequence(datasets.Value("string")),
80
+ "metadata": datasets.Features(
81
+ {
82
+ "size_bytes": datasets.Value("int32"),
83
+ "mime_type": datasets.Value("string"),
84
+ "width": datasets.Value("int32"),
85
+ "height": datasets.Value("int32"),
86
+ "num_channels": datasets.Value("int32"),
87
+ "author": datasets.Value("string"),
88
+ "category": datasets.Value("string"),
89
+ "document_name": datasets.Value("string"),
90
+ "source": datasets.Value("string"),
91
+ "year": datasets.Value("int32")
92
+ }
93
+ ),
94
+ "_media_type": datasets.Value("string"),
95
+ "_rand": datasets.Value("string"),
96
+ "detections": datasets.Features(
97
+ {
98
+ "detections": datasets.Sequence(
99
+ datasets.Features(
100
+ {
101
+ "id": datasets.Value("string"),
102
+ "attributes": datasets.Sequence(datasets.Value("string")),
103
+ "tags": datasets.Value("string"),
104
+ "label": datasets.Value("string"),
105
+ "bounding_box": datasets.Sequence(datasets.Value("float32")),
106
+ "confidence": datasets.Value("float32"),
107
+ "index": datasets.Value("int32"),
108
+ "page": datasets.Value("int32"),
109
+ "block": datasets.Value("int32"),
110
+ "paragraph": datasets.Value("int32"),
111
+ "word": datasets.Value("int32"),
112
+ "text": datasets.Value("string"),
113
+ }
114
+ )
115
  )
116
+ }
117
+ ),
118
+ "image": datasets.Image()
119
+ }
120
+ ),
121
+ length=-1,
122
+ id=None
123
  ),
124
+ "references": datasets.Sequence(
125
+ feature=datasets.Features(
126
+ {
127
+ "id": datasets.Value("string"),
128
+ "filepath": datasets.Value("string"),
129
+ "tags": datasets.Sequence(datasets.Value("string")),
130
+ "metadata": datasets.Features(
131
+ {
132
+ "size_bytes": datasets.Value("int32"),
133
+ "mime_type": datasets.Value("string"),
134
+ "width": datasets.Value("int32"),
135
+ "height": datasets.Value("int32"),
136
+ "num_channels": datasets.Value("int32"),
137
+ "author": datasets.Value("string"),
138
+ "category": datasets.Value("string"),
139
+ "document_name": datasets.Value("string"),
140
+ "source": datasets.Value("string"),
141
+ "year": datasets.Value("int32")
142
+ }
143
+ ),
144
+ "_media_type": datasets.Value("string"),
145
+ "_rand": datasets.Value("string"),
146
+ "detections": datasets.Features(
147
+ {
148
+ "detections": datasets.Sequence(
149
+ datasets.Features(
150
+ {
151
+ "id": datasets.Value("string"),
152
+ "attributes": datasets.Sequence(datasets.Value("string")),
153
+ "tags": datasets.Value("string"),
154
+ "label": datasets.Value("string"),
155
+ "bounding_box": datasets.Sequence(datasets.Value("float32")),
156
+ "confidence": datasets.Value("float32"),
157
+ "index": datasets.Value("int32"),
158
+ "page": datasets.Value("int32"),
159
+ "block": datasets.Value("int32"),
160
+ "paragraph": datasets.Value("int32"),
161
+ "word": datasets.Value("int32"),
162
+ "text": datasets.Value("string"),
163
+ }
164
+ )
165
  )
166
+ }
167
+ ),
168
+ "image": datasets.Image()
169
+ }
170
+ ),
171
+ length=-1,
172
+ id=None
173
+ ),
174
  }
175
  ),
176
  # Homepage of the module for documentation