jsalvad0r committed on
Commit
135117a
·
1 Parent(s): 640b4be

unit testing

Browse files
Files changed (2) hide show
  1. README.md +1 -1
  2. tests.py +65 -1
README.md CHANGED
@@ -82,7 +82,7 @@ print(metric.inputs_description)
82
  [//]: # (- **input_field** *(type): Definition of input, with explanation if necessary. State any default value(s).*)
83
 
84
  ### Output Values
85
- List of `Scores` dataclass corresponding to each sample -
86
 
87
  - `precision: float`: Precision score, which ranges from 0.0 to 1.0.
88
  - `recall: List[float]`: Recall score corresponding to each reference
 
82
  [//]: # (- **input_field** *(type): Definition of input, with explanation if necessary. State any default value(s).*)
83
 
84
  ### Output Values
85
+ Singleton/List of `Scores` dataclass corresponding to each sample -
86
 
87
  - `precision: float`: Precision score, which ranges from 0.0 to 1.0.
88
  - `recall: List[float]`: Recall score corresponding to each reference
tests.py CHANGED
@@ -249,7 +249,7 @@ class TestSemF1(unittest.TestCase):
249
  'this is the second prediction sample',
250
  ]
251
 
252
- def test_aggregate_flag(self):
253
  """
254
  check if a `Scores` class is returned instead of a list of
255
  `Scores`
@@ -266,6 +266,70 @@ class TestSemF1(unittest.TestCase):
266
  )
267
  self.assertIsInstance(scores, Scores)
268
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
269
 
270
  def test_untokenized_single_reference(self):
271
  scores = self.semf1_metric.compute(
 
249
  'this is the second prediction sample',
250
  ]
251
 
252
+ def test_aggregate_multi_sample(self):
253
  """
254
  check if a `Scores` class is returned instead of a list of
255
  `Scores`
 
266
  )
267
  self.assertIsInstance(scores, Scores)
268
 
269
+ def test_aggregate_untokenized_single_ref(self):
270
+ scores = self.semf1_metric.compute(
271
+ predictions=self.untokenized_single_reference_predictions,
272
+ references=self.untokenized_single_reference_references,
273
+ tokenize_sentences=True,
274
+ multi_references=False,
275
+ gpu=False,
276
+ batch_size=32,
277
+ verbose=False,
278
+ aggregate=True,
279
+ )
280
+ self.assertIsInstance(scores, Scores)
281
+
282
+ def test_aggregate_tokenized_single_ref(self):
283
+ scores = self.semf1_metric.compute(
284
+ predictions=self.tokenized_single_reference_predictions,
285
+ references=self.tokenized_single_reference_references,
286
+ tokenize_sentences=True,
287
+ multi_references=False,
288
+ gpu=False,
289
+ batch_size=32,
290
+ verbose=False,
291
+ aggregate=True,
292
+ )
293
+ self.assertIsInstance(scores, Scores)
294
+
295
+ def test_aggregate_untokenized_multi_ref(self):
296
+ scores = self.semf1_metric.compute(
297
+ predictions=self.untokenized_multi_reference_predictions,
298
+ references=self.untokenized_multi_reference_references,
299
+ tokenize_sentences=True,
300
+ multi_references=False,
301
+ gpu=False,
302
+ batch_size=32,
303
+ verbose=False,
304
+ aggregate=True,
305
+ )
306
+ self.assertIsInstance(scores, Scores)
307
+
308
+ def test_aggregate_tokenized_multi_ref(self):
309
+ scores = self.semf1_metric.compute(
310
+ predictions=self.tokenized_multi_reference_predictions,
311
+ references=self.tokenized_multi_reference_references,
312
+ tokenize_sentences=True,
313
+ multi_references=False,
314
+ gpu=False,
315
+ batch_size=32,
316
+ verbose=False,
317
+ aggregate=True,
318
+ )
319
+ self.assertIsInstance(scores, Scores)
320
+
321
+ def test_aggregate_same_pred_and_ref(self):
322
+ scores = self.semf1_metric.compute(
323
+ predictions=self.tokenized_single_reference_predictions,
324
+ references=self.tokenized_single_reference_predictions,
325
+ tokenize_sentences=True,
326
+ multi_references=False,
327
+ gpu=False,
328
+ batch_size=32,
329
+ verbose=False,
330
+ aggregate=True,
331
+ )
332
+ self.assertIsInstance(scores, Scores)
333
 
334
  def test_untokenized_single_reference(self):
335
  scores = self.semf1_metric.compute(