Assignment based metrics

ie_eval.metrics.assignment_based

Compute the reading-order-independent ECER/EWER/Nerval metrics from a label/prediction dataset.

Attributes

logger `module-attribute`

logger = getLogger(__name__)

Classes

Functions

compute_oiecerewer

compute_oiecerewer(
    label_dir: Path,
    prediction_dir: Path,
    by_category: bool = False,
    print_table: bool = True,
) -> PrettyTable

Compute reading-order-independent ECER and EWER metrics.

Parameters:

Name	Type	Description	Default
`label_dir`	`Path`	Path to the directory containing BIO label files.	required
`prediction_dir`	`Path`	Path to the directory containing BIO prediction files.	required
`by_category`	`bool`	Whether to compute the metric globally or for each category. Defaults to False. (Not implemented yet)	`False`
`print_table`	`bool`	Whether to print the table. Defaults to True.	`True`

Returns:

Name	Type	Description
`PrettyTable`	`PrettyTable`	The evaluation table formatted in Markdown.

Source code in ie_eval/metrics/assignment_based.py

def compute_oiecerewer(
    label_dir: Path,
    prediction_dir: Path,
    by_category: bool = False,
    print_table: bool = True,
) -> PrettyTable:
    """Compute reading-order-independent ECER and EWER metrics.

    Args:
        label_dir (Path): Path to the directory containing BIO label files.
        prediction_dir (Path): Path to the directory containing BIO prediction files.
        by_category (bool, optional): Whether to compute the metric globally or for each category. Defaults to False. (Not implemented yet)
        print_table (bool, optional): Whether to print the table. Defaults to True.

    Returns:
        PrettyTable: The evaluation table formatted in Markdown.
    """
    dataset = load_dataset(label_dir, prediction_dir)
    # Initialize scores
    ecer_total_score_err = MicroAverageErrorRate()
    ewer_total_score_err = MicroAverageErrorRate()

    # Iterate over the dataset
    for label, prediction in dataset:
        ecer_score = OiEcerEwer(
            labels=label.entities,
            predictions=prediction.entities,
            compute_ecer=True,
        )

        ewer_score = OiEcerEwer(
            labels=label.entities,
            predictions=prediction.entities,
            compute_ecer=False,
        )

        # Micro average
        ecer_total_score_err.update(GLOBAL_STAT_NAME, ecer_score)
        ewer_total_score_err.update(GLOBAL_STAT_NAME, ewer_score)

        # TODO: https://gitlab.teklia.com/ner/metrics/ie-eval/-/issues/12
        if by_category:
            continue

    # Format and display results
    table = make_oi_ecer_ewer_prettytable(
        ecer_total_score_err,
        ewer_total_score_err,
    )
    if print_table:
        print(table)  # noqa: T201
    return table

compute_oinerval

compute_oinerval(
    label_dir: Path,
    prediction_dir: Path,
    nerval_threshold: float = 0.0,
    by_category: bool = False,
    print_table: bool = True,
) -> PrettyTable

Compute reading-order-independent Nerval Precision, Recall and F1 scores.