# QuAcc/quacc/evaluation/method.py

from functools import wraps

import numpy as np
import sklearn.metrics as metrics
from quapy.data import LabelledCollection
from quapy.protocol import AbstractStochasticSeededProtocol
from sklearn.base import BaseEstimator

import quacc.error as error
from quacc.evaluation.report import EvaluationReport

from ..estimator import (
    AccuracyEstimator,
    BinaryQuantifierAccuracyEstimator,
    MulticlassAccuracyEstimator,
)

# Registry of evaluation methods, keyed by the name of the decorated function.
_methods = {}


def method(func):
    """Register ``func`` as an evaluation method and return its wrapper.

    The wrapper accepts exactly ``(c_model, validation, protocol)`` and
    forwards them unchanged to ``func``. It is stored in the module-level
    ``_methods`` dictionary under ``func.__name__``; a later registration
    with the same name replaces the earlier entry.
    """

    def _forward(c_model, validation, protocol):
        return func(c_model, validation, protocol)

    # Copy name/docstring/etc. from ``func`` so the registry entry is
    # indistinguishable (by metadata) from the decorated function.
    registered = wraps(func)(_forward)
    _methods[func.__name__] = registered
    return registered


def estimate(
    estimator: AccuracyEstimator,
    protocol: AbstractStochasticSeededProtocol,
):
    """Run ``estimator`` over every sample generated by ``protocol``.

    For each sample yielded by ``protocol()`` the estimator's ``extend`` is
    called (it returns a pair: an extended sample and predicted
    probabilities), then ``estimate`` is called on the extended sample's
    ``X`` with ``ext=True``.

    Returns:
        A 5-tuple of parallel lists, one entry per sample:
        ``(base_prevs, true_prevs, estim_prevs, pred_probas, labels)`` where
        ``base_prevs`` holds ``sample.prevalence()``, ``true_prevs`` holds
        the extended sample's ``prevalence()``, ``estim_prevs`` holds the
        estimator output, ``pred_probas`` holds the probabilities returned
        by ``extend`` and ``labels`` holds ``sample.y``.
    """
    records = []
    for sample in protocol():
        extended, proba = estimator.extend(sample)
        estimated = estimator.estimate(extended.X, ext=True)
        records.append(
            (
                sample.prevalence(),
                extended.prevalence(),
                estimated,
                proba,
                sample.y,
            )
        )

    # Transpose the per-sample records into five per-field lists.
    base_prevs, true_prevs, estim_prevs, pred_probas, labels = (
        [record[column] for record in records] for column in range(5)
    )
    return base_prevs, true_prevs, estim_prevs, pred_probas, labels


def evaluation_report(
    estimator: AccuracyEstimator,
    protocol: AbstractStochasticSeededProtocol,
    method: str,
) -> EvaluationReport:
    """Build an ``EvaluationReport`` named ``method`` from ``estimate`` output.

    One row is appended per sample, keyed by the sample's base prevalence,
    with these fields:

    * ``acc_score`` -- ``error.acc`` of the estimated prevalence;
    * ``acc`` -- absolute difference between the classifier accuracy
      (``accuracy_score`` of the labels against the argmax of the predicted
      probabilities) and ``acc_score``;
    * ``f1_score`` -- ``error.f1`` of the estimated prevalence;
    * ``f1`` -- absolute difference between ``error.f1`` of the true
      prevalence and ``f1_score``.

    The estimator's ``fit_score`` is copied onto the report before returning.
    """
    per_sample = estimate(estimator, protocol)
    report = EvaluationReport(name=method)

    for base_prev, true_prev, estim_prev, pred_proba, label in zip(*per_sample):
        # Hard predictions are the most probable class along the last axis.
        predicted = np.argmax(pred_proba, axis=-1)
        estimated_acc = error.acc(estim_prev)
        estimated_f1 = error.f1(estim_prev)
        observed_acc = metrics.accuracy_score(label, predicted)
        observed_f1 = error.f1(true_prev)
        report.append_row(
            base_prev,
            acc_score=estimated_acc,
            acc=abs(observed_acc - estimated_acc),
            f1_score=estimated_f1,
            f1=abs(observed_f1 - estimated_f1),
        )

    report.fit_score = estimator.fit_score
    return report


def evaluate(
    c_model: BaseEstimator,
    validation: LabelledCollection,
    protocol: AbstractStochasticSeededProtocol,
    method: str,
    q_model: str,
    **kwargs,
):
    """Fit an accuracy estimator on ``validation`` and report on ``protocol``.

    Args:
        c_model: classifier handed to the estimator constructor.
        validation: collection the estimator is fitted on.
        protocol: sample generator passed on to ``evaluation_report``.
        method: ``"bin"`` selects ``BinaryQuantifierAccuracyEstimator``,
            ``"mul"`` selects ``MulticlassAccuracyEstimator``.
        q_model: quantifier name; upper-cased before being passed to the
            estimator as ``q_model`` and used verbatim in the report name.
        **kwargs: forwarded unchanged to the estimator constructor.

    Returns:
        The ``EvaluationReport`` produced by ``evaluation_report``. Its name
        is ``"{method}_{q_model}"``, followed by ``"_{recalib}"`` when a
        ``recalib`` keyword with a non-``None`` value was given, followed by
        ``"_gs"`` when ``gs=True`` was given.

    Raises:
        KeyError: if ``method`` is neither ``"bin"`` nor ``"mul"``.
    """
    estimator_cls = {
        "bin": BinaryQuantifierAccuracyEstimator,
        "mul": MulticlassAccuracyEstimator,
    }[method]
    estimator: AccuracyEstimator = estimator_cls(
        c_model, q_model=q_model.upper(), **kwargs
    )
    estimator.fit(validation)

    report_name = f"{method}_{q_model}"
    # An explicit ``recalib=None`` means "no recalibration"; it must not
    # leak into the report name as a literal "_None" suffix.
    recalib = kwargs.get("recalib")
    if recalib is not None:
        report_name += f"_{recalib}"
    if ("gs", True) in kwargs.items():
        report_name += "_gs"
    return evaluation_report(estimator, protocol, report_name)


@method
def bin_sld(c_model, validation, protocol) -> EvaluationReport:
    """Run ``evaluate`` with the ``"bin"`` estimator and the ``"sld"`` quantifier."""
    return evaluate(c_model, validation, protocol, method="bin", q_model="sld")


@method
def mul_sld(c_model, validation, protocol) -> EvaluationReport:
    """Run ``evaluate`` with the ``"mul"`` estimator and the ``"sld"`` quantifier."""
    return evaluate(c_model, validation, protocol, method="mul", q_model="sld")


@method
def bin_sld_bcts(c_model, validation, protocol) -> EvaluationReport:
    """Run ``evaluate`` with ``"bin"``/``"sld"`` and ``recalib="bcts"``."""
    return evaluate(
        c_model,
        validation,
        protocol,
        method="bin",
        q_model="sld",
        recalib="bcts",
    )


@method
def mul_sld_bcts(c_model, validation, protocol) -> EvaluationReport:
    """Run ``evaluate`` with ``"mul"``/``"sld"`` and ``recalib="bcts"``."""
    return evaluate(
        c_model,
        validation,
        protocol,
        method="mul",
        q_model="sld",
        recalib="bcts",
    )


@method
def bin_sld_gs(c_model, validation, protocol) -> EvaluationReport:
    """Run ``evaluate`` with ``"bin"``/``"sld"`` and ``gs=True``."""
    return evaluate(
        c_model,
        validation,
        protocol,
        method="bin",
        q_model="sld",
        gs=True,
    )


@method
def mul_sld_gs(c_model, validation, protocol) -> EvaluationReport:
    """Run ``evaluate`` with ``"mul"``/``"sld"`` and ``gs=True``."""
    return evaluate(
        c_model,
        validation,
        protocol,
        method="mul",
        q_model="sld",
        gs=True,
    )


@method
def bin_cc(c_model, validation, protocol) -> EvaluationReport:
    """Run ``evaluate`` with the ``"bin"`` estimator and the ``"cc"`` quantifier."""
    return evaluate(c_model, validation, protocol, method="bin", q_model="cc")


@method
def mul_cc(c_model, validation, protocol) -> EvaluationReport:
    """Run ``evaluate`` with the ``"mul"`` estimator and the ``"cc"`` quantifier."""
    return evaluate(c_model, validation, protocol, method="mul", q_model="cc")
diag plot fixed, opts, avg plot, best score added 2023-10-27 12:37:18 +02:00			`from functools import wraps`

plots, avg table, conf added; method updated 2023-10-23 03:14:35 +02:00			`import numpy as np`
			`import sklearn.metrics as metrics`
baselines refactored and updated, report updated 2023-10-19 02:36:53 +02:00			`from quapy.data import LabelledCollection`
diag plot fixed, opts, avg plot, best score added 2023-10-27 12:37:18 +02:00			`from quapy.protocol import AbstractStochasticSeededProtocol`
baselines refactored and updated, report updated 2023-10-19 02:36:53 +02:00			`from sklearn.base import BaseEstimator`

			`import quacc.error as error`
			`from quacc.evaluation.report import EvaluationReport`

			`from ..estimator import (`
			`AccuracyEstimator,`
			`BinaryQuantifierAccuracyEstimator,`
			`MulticlassAccuracyEstimator,`
			`)`

diag plot fixed, opts, avg plot, best score added 2023-10-27 12:37:18 +02:00			`_methods = {}`


			`def method(func):`
			`@wraps(func)`
			`def wrapper(c_model, validation, protocol):`
			`return func(c_model, validation, protocol)`

			`_methods[func.__name__] = wrapper`

			`return wrapper`

baselines refactored and updated, report updated 2023-10-19 02:36:53 +02:00
			`def estimate(`
			`estimator: AccuracyEstimator,`
			`protocol: AbstractStochasticSeededProtocol,`
			`):`
plots, avg table, conf added; method updated 2023-10-23 03:14:35 +02:00			`base_prevs, true_prevs, estim_prevs, pred_probas, labels = [], [], [], [], []`
baselines refactored and updated, report updated 2023-10-19 02:36:53 +02:00			`for sample in protocol():`
plots, avg table, conf added; method updated 2023-10-23 03:14:35 +02:00			`e_sample, pred_proba = estimator.extend(sample)`
baselines refactored and updated, report updated 2023-10-19 02:36:53 +02:00			`estim_prev = estimator.estimate(e_sample.X, ext=True)`
			`base_prevs.append(sample.prevalence())`
			`true_prevs.append(e_sample.prevalence())`
			`estim_prevs.append(estim_prev)`
plots, avg table, conf added; method updated 2023-10-23 03:14:35 +02:00			`pred_probas.append(pred_proba)`
			`labels.append(sample.y)`
baselines refactored and updated, report updated 2023-10-19 02:36:53 +02:00
plots, avg table, conf added; method updated 2023-10-23 03:14:35 +02:00			`return base_prevs, true_prevs, estim_prevs, pred_probas, labels`
baselines refactored and updated, report updated 2023-10-19 02:36:53 +02:00

			`def evaluation_report(`
			`estimator: AccuracyEstimator,`
			`protocol: AbstractStochasticSeededProtocol,`
			`method: str,`
			`) -> EvaluationReport:`
plots, avg table, conf added; method updated 2023-10-23 03:14:35 +02:00			`base_prevs, true_prevs, estim_prevs, pred_probas, labels = estimate(`
			`estimator, protocol`
			`)`
			`report = EvaluationReport(name=method)`

			`for base_prev, true_prev, estim_prev, pred_proba, label in zip(`
			`base_prevs, true_prevs, estim_prevs, pred_probas, labels`
			`):`
			`pred = np.argmax(pred_proba, axis=-1)`
baselines refactored and updated, report updated 2023-10-19 02:36:53 +02:00			`acc_score = error.acc(estim_prev)`
			`f1_score = error.f1(estim_prev)`
			`report.append_row(`
Dataset refactored, training sampling added 2023-10-20 23:36:05 +02:00			`base_prev,`
plots, avg table, conf added; method updated 2023-10-23 03:14:35 +02:00			`acc_score=acc_score,`
			`acc=abs(metrics.accuracy_score(label, pred) - acc_score),`
baselines refactored and updated, report updated 2023-10-19 02:36:53 +02:00			`f1_score=f1_score,`
Dataset refactored, training sampling added 2023-10-20 23:36:05 +02:00			`f1=abs(error.f1(true_prev) - f1_score),`
baselines refactored and updated, report updated 2023-10-19 02:36:53 +02:00			`)`

diag plot fixed, opts, avg plot, best score added 2023-10-27 12:37:18 +02:00			`report.fit_score = estimator.fit_score`

baselines refactored and updated, report updated 2023-10-19 02:36:53 +02:00			`return report`


			`def evaluate(`
			`c_model: BaseEstimator,`
			`validation: LabelledCollection,`
			`protocol: AbstractStochasticSeededProtocol,`
			`method: str,`
plots, avg table, conf added; method updated 2023-10-23 03:14:35 +02:00			`q_model: str,`
			`**kwargs,`
baselines refactored and updated, report updated 2023-10-19 02:36:53 +02:00			`):`
Dataset refactored, training sampling added 2023-10-20 23:36:05 +02:00			`estimator: AccuracyEstimator = {`
baselines refactored and updated, report updated 2023-10-19 02:36:53 +02:00			`"bin": BinaryQuantifierAccuracyEstimator,`
			`"mul": MulticlassAccuracyEstimator,`
diag plot fixed, opts, avg plot, best score added 2023-10-27 12:37:18 +02:00			`}[method](c_model, q_model=q_model.upper(), **kwargs)`
baselines refactored and updated, report updated 2023-10-19 02:36:53 +02:00			`estimator.fit(validation)`
plots, avg table, conf added; method updated 2023-10-23 03:14:35 +02:00			`_method = f"{method}_{q_model}"`
diag plot fixed, opts, avg plot, best score added 2023-10-27 12:37:18 +02:00			`if "recalib" in kwargs:`
			`_method += f"_{kwargs['recalib']}"`
			`if ("gs", True) in kwargs.items():`
			`_method += "_gs"`
plots, avg table, conf added; method updated 2023-10-23 03:14:35 +02:00			`return evaluation_report(estimator, protocol, _method)`
baselines refactored and updated, report updated 2023-10-19 02:36:53 +02:00

diag plot fixed, opts, avg plot, best score added 2023-10-27 12:37:18 +02:00			`@method`
			`def bin_sld(c_model, validation, protocol) -> EvaluationReport:`
			`return evaluate(c_model, validation, protocol, "bin", "sld")`
Dataset refactored, training sampling added 2023-10-20 23:36:05 +02:00

diag plot fixed, opts, avg plot, best score added 2023-10-27 12:37:18 +02:00			`@method`
			`def mul_sld(c_model, validation, protocol) -> EvaluationReport:`
			`return evaluate(c_model, validation, protocol, "mul", "sld")`
plots, avg table, conf added; method updated 2023-10-23 03:14:35 +02:00

diag plot fixed, opts, avg plot, best score added 2023-10-27 12:37:18 +02:00			`@method`
			`def bin_sld_bcts(c_model, validation, protocol) -> EvaluationReport:`
			`return evaluate(c_model, validation, protocol, "bin", "sld", recalib="bcts")`
plots, avg table, conf added; method updated 2023-10-23 03:14:35 +02:00

diag plot fixed, opts, avg plot, best score added 2023-10-27 12:37:18 +02:00			`@method`
			`def mul_sld_bcts(c_model, validation, protocol) -> EvaluationReport:`
			`return evaluate(c_model, validation, protocol, "mul", "sld", recalib="bcts")`
plots, avg table, conf added; method updated 2023-10-23 03:14:35 +02:00

diag plot fixed, opts, avg plot, best score added 2023-10-27 12:37:18 +02:00			`@method`
			`def bin_sld_gs(c_model, validation, protocol) -> EvaluationReport:`
			`return evaluate(c_model, validation, protocol, "bin", "sld", gs=True)`
plots, avg table, conf added; method updated 2023-10-23 03:14:35 +02:00

diag plot fixed, opts, avg plot, best score added 2023-10-27 12:37:18 +02:00			`@method`
			`def mul_sld_gs(c_model, validation, protocol) -> EvaluationReport:`
			`return evaluate(c_model, validation, protocol, "mul", "sld", gs=True)`
plots, avg table, conf added; method updated 2023-10-23 03:14:35 +02:00

diag plot fixed, opts, avg plot, best score added 2023-10-27 12:37:18 +02:00			`@method`
			`def bin_cc(c_model, validation, protocol) -> EvaluationReport:`
			`return evaluate(c_model, validation, protocol, "bin", "cc")`
plots, avg table, conf added; method updated 2023-10-23 03:14:35 +02:00

diag plot fixed, opts, avg plot, best score added 2023-10-27 12:37:18 +02:00			`@method`
			`def mul_cc(c_model, validation, protocol) -> EvaluationReport:`
			`return evaluate(c_model, validation, protocol, "mul", "cc")`