unitxt.test_utils.metrics module

unitxt.test_utils.metrics.apply_metric(metric: Metric, predictions: List[Any], references: List[List[Any]], task_data: List[dict] | None = None, perform_validations_in_apply_metric=True)
unitxt.test_utils.metrics.dict_equal(dict1, dict2)
unitxt.test_utils.metrics.round_floats(obj, precision=2, recursive=True)
unitxt.test_utils.metrics.test_metric(metric: Metric, predictions: List[Any], references: List[List[Any]], instance_targets: List[dict], global_target: dict, task_data: List[dict] | None = None)