Spaces:
Runtime error
Runtime error
unit testing
Browse files
README.md
CHANGED
|
@@ -82,7 +82,7 @@ print(metric.inputs_description)
|
|
| 82 |
[//]: # (- **input_field** *(type): Definition of input, with explanation if necessary. State any default value(s).*)
|
| 83 |
|
| 84 |
### Output Values
|
| 85 |
-
List of `Scores` dataclass corresponding to each sample -
|
| 86 |
|
| 87 |
- `precision: float`: Precision score, which ranges from 0.0 to 1.0.
|
| 88 |
- `recall: List[float]`: Recall score corresponding to each reference
|
|
|
|
| 82 |
[//]: # (- **input_field** *(type): Definition of input, with explanation if necessary. State any default value(s).*)
|
| 83 |
|
| 84 |
### Output Values
|
| 85 |
+
A single `Scores` dataclass (when `aggregate=True`), or a list of `Scores` dataclasses with one entry per sample -
|
| 86 |
|
| 87 |
- `precision: float`: Precision score, which ranges from 0.0 to 1.0.
|
| 88 |
- `recall: List[float]`: Recall score corresponding to each reference
|
tests.py
CHANGED
|
@@ -249,7 +249,7 @@ class TestSemF1(unittest.TestCase):
|
|
| 249 |
'this is the second prediction sample',
|
| 250 |
]
|
| 251 |
|
| 252 |
-
def
|
| 253 |
"""
|
| 254 |
check if a `Scores` class is returned instead of a list of
|
| 255 |
`Scores`
|
|
@@ -266,6 +266,70 @@ class TestSemF1(unittest.TestCase):
|
|
| 266 |
)
|
| 267 |
self.assertIsInstance(scores, Scores)
|
| 268 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 269 |
|
| 270 |
def test_untokenized_single_reference(self):
|
| 271 |
scores = self.semf1_metric.compute(
|
|
|
|
| 249 |
'this is the second prediction sample',
|
| 250 |
]
|
| 251 |
|
| 252 |
+
def test_aggregate_multi_sample(self):
|
| 253 |
"""
|
| 254 |
check if a `Scores` class is returned instead of a list of
|
| 255 |
`Scores`
|
|
|
|
| 266 |
)
|
| 267 |
self.assertIsInstance(scores, Scores)
|
| 268 |
|
| 269 |
+
def test_aggregate_untokenized_single_ref(self):
|
| 270 |
+
scores = self.semf1_metric.compute(
|
| 271 |
+
predictions=self.untokenized_single_reference_predictions,
|
| 272 |
+
references=self.untokenized_single_reference_references,
|
| 273 |
+
tokenize_sentences=True,
|
| 274 |
+
multi_references=False,
|
| 275 |
+
gpu=False,
|
| 276 |
+
batch_size=32,
|
| 277 |
+
verbose=False,
|
| 278 |
+
aggregate=True,
|
| 279 |
+
)
|
| 280 |
+
self.assertIsInstance(scores, Scores)
|
| 281 |
+
|
| 282 |
+
def test_aggregate_tokenized_single_ref(self):
|
| 283 |
+
scores = self.semf1_metric.compute(
|
| 284 |
+
predictions=self.tokenized_single_reference_predictions,
|
| 285 |
+
references=self.tokenized_single_reference_references,
|
| 286 |
+
tokenize_sentences=True,
|
| 287 |
+
multi_references=False,
|
| 288 |
+
gpu=False,
|
| 289 |
+
batch_size=32,
|
| 290 |
+
verbose=False,
|
| 291 |
+
aggregate=True,
|
| 292 |
+
)
|
| 293 |
+
self.assertIsInstance(scores, Scores)
|
| 294 |
+
|
| 295 |
+
def test_aggregate_untokenized_multi_ref(self):
|
| 296 |
+
scores = self.semf1_metric.compute(
|
| 297 |
+
predictions=self.untokenized_multi_reference_predictions,
|
| 298 |
+
references=self.untokenized_multi_reference_references,
|
| 299 |
+
tokenize_sentences=True,
|
| 300 |
+
multi_references=False,
|
| 301 |
+
gpu=False,
|
| 302 |
+
batch_size=32,
|
| 303 |
+
verbose=False,
|
| 304 |
+
aggregate=True,
|
| 305 |
+
)
|
| 306 |
+
self.assertIsInstance(scores, Scores)
|
| 307 |
+
|
| 308 |
+
def test_aggregate_tokenized_multi_ref(self):
|
| 309 |
+
scores = self.semf1_metric.compute(
|
| 310 |
+
predictions=self.tokenized_multi_reference_predictions,
|
| 311 |
+
references=self.tokenized_multi_reference_references,
|
| 312 |
+
tokenize_sentences=True,
|
| 313 |
+
multi_references=False,
|
| 314 |
+
gpu=False,
|
| 315 |
+
batch_size=32,
|
| 316 |
+
verbose=False,
|
| 317 |
+
aggregate=True,
|
| 318 |
+
)
|
| 319 |
+
self.assertIsInstance(scores, Scores)
|
| 320 |
+
|
| 321 |
+
def test_aggregate_same_pred_and_ref(self):
|
| 322 |
+
scores = self.semf1_metric.compute(
|
| 323 |
+
predictions=self.tokenized_single_reference_predictions,
|
| 324 |
+
references=self.tokenized_single_reference_predictions,
|
| 325 |
+
tokenize_sentences=True,
|
| 326 |
+
multi_references=False,
|
| 327 |
+
gpu=False,
|
| 328 |
+
batch_size=32,
|
| 329 |
+
verbose=False,
|
| 330 |
+
aggregate=True,
|
| 331 |
+
)
|
| 332 |
+
self.assertIsInstance(scores, Scores)
|
| 333 |
|
| 334 |
def test_untokenized_single_reference(self):
|
| 335 |
scores = self.semf1_metric.compute(
|