plots refactoring started

2024-04-04 17:03:52 +02:00 · 2024-04-04 17:03:52 +02:00 · b8e43c02f2
parent 4a06c83256
commit b8e43c02f2
2 changed files with 189 additions and 302 deletions
--- a/quacc/plot/init.py
+++ b/quacc/plot/init.py
@ -1,7 +1,7 @@
-from quacc.plot.plot import (
+from quacc.legacy.plot.plot import (
    get_backend,
    plot_delta,
    plot_diagonal,
    plot_shift,
    plot_fit_scores,
    plot_shift,
 )
--- a/quacc/plot/plotly.py
+++ b/quacc/plot/plotly.py
@ -1,78 +1,49 @@
-from collections import defaultdict
+import os
 from pathlib import Path
 import numpy as np
 import plotly
 import plotly.graph_objects as go
-from quacc.evaluation.estimators import CE, _renames
+MODE = "lines"
-from quacc.plot.base import BasePlot
+L_WIDTH = 5
-
+LEGEND = {
-
+    "font": {
-class PlotCfg:
+        "family": "DejaVu Sans",
-    def __init__(self, mode, lwidth, font=None, legend=None, template="seaborn"):
+        "size": 24,
        self.mode = mode
        self.lwidth = lwidth
        self.legend = {} if legend is None else legend
        self.font = {} if font is None else font
        self.template = template
 web_cfg = PlotCfg("lines+markers", 2)
 png_cfg_old = PlotCfg(
    "lines",
    5,
    legend=dict(
        orientation="h",
        yanchor="bottom",
        xanchor="right",
        y=1.02,
        x=1,
        font=dict(size=24),
    ),
    font=dict(size=24),
    # template="ggplot2",
 )
 png_cfg = PlotCfg(
    "lines",
    5,
    legend=dict(
        font=dict(
            family="DejaVu Sans",
            size=24,
        ),
    ),
    font=dict(size=24),
    # template="ggplot2",
 )
 _cfg = png_cfg
 class PlotlyPlot(BasePlot):
    __themes = defaultdict(
        lambda: {
            "template": _cfg.template,
    }
 }
 FONT = {"size": 24}
 TEMPLATE = "ggplot2"
 def _save_or_return(fig, basedir, dataset_name, measure_name, plot_type):
    if basedir is not None:
        plotsubdir = dataset_name
        os.path.join(basedir, "plots", measure_name, plotsubdir, plot_type + ".svg")
    return fig
 def _update_layout(fig, title, x_label, y_label, **kwargs):
    fig.update_layout(
        xaxis_title=x_label,
        yaxis_title=y_label,
        template=TEMPLATE,
        font=FONT,
        legend=LEGEND,
        **kwargs,
    )
    __themes = __themes | {
        "dark": {
            "template": "plotly_dark",
        },
    }
    def __init__(self, theme=None):
        self.theme = PlotlyPlot.__themes[theme]
        self.rename = True
-    def hex_to_rgb(self, hex: str, t: float | None = None):
+def _hex_to_rgb(self, hex: str, t: float | None = None):
    hex = hex.lstrip("#")
    rgb = [int(hex[i : i + 2], 16) for i in [0, 2, 4]]
    if t is not None:
        rgb.append(t)
    return f"{'rgb' if t is None else 'rgba'}{str(tuple(rgb))}"
-    def get_colors(self, num):
+
 def _get_colors(self, num):
    match num:
        case v if v > 10:
            __colors = plotly.colors.qualitative.Light24
@ -86,156 +57,45 @@ class PlotlyPlot(BasePlot):
    return __generator(__colors)
    def update_layout(self, fig, title, x_label, y_label):
        fig.update_layout(
            # title=title,
            xaxis_title=x_label,
            yaxis_title=y_label,
            template=self.theme["template"],
            font=_cfg.font,
            legend=_cfg.legend,
        )
-    def save_fig(self, fig, base_path, title) -> Path:
+def _get_ref_limits(true_accs: np.ndarray, estim_accs: dict[str, np.ndarray]):
-        return None
+    """get lmits of reference line"""
    def rename_plots(
        self,
        columns,
    ):
        if not self.rename:
            return columns
        new_columns = []
        for c in columns:
            nc = c
            for old, new in _renames.items():
                if c.startswith(old):
                    nc = new + c[len(old) :]
            new_columns.append(nc)
        return np.array(new_columns)
    def plot_delta(
        self,
        base_prevs,
        columns,
        data,
        *,
        stdevs=None,
        pos_class=1,
        title="default",
        x_label="prevs.",
        y_label="error",
        legend=True,
    ) -> go.Figure:
        fig = go.Figure()
        if isinstance(base_prevs[0], float):
            base_prevs = np.around([(1 - bp, bp) for bp in base_prevs], decimals=4)
        x = [str(tuple(bp)) for bp in base_prevs]
        named_data = {c: d for c, d in zip(columns, data)}
        r_columns = {c: r for c, r in zip(columns, self.rename_plots(columns))}
        line_colors = self.get_colors(len(columns))
        # for name, delta in zip(columns, data):
        columns = np.array(CE.name.sort(columns))
        for name in columns:
            delta = named_data[name]
            r_name = r_columns[name]
            color = next(line_colors)
            _line = [
                go.Scatter(
                    x=x,
                    y=delta,
                    mode=_cfg.mode,
                    name=r_name,
                    line=dict(color=self.hex_to_rgb(color), width=_cfg.lwidth),
                    hovertemplate="prev.: %{x}<br>error: %{y:,.4f}",
                )
            ]
            _error = []
            if stdevs is not None:
                _col_idx = np.where(columns == name)[0]
                stdev = stdevs[_col_idx].flatten()
                _error = [
                    go.Scatter(
                        x=np.concatenate([x, x[::-1]]),
                        y=np.concatenate([delta - stdev, (delta + stdev)[::-1]]),
                        name=int(_col_idx[0]),
                        fill="toself",
                        fillcolor=self.hex_to_rgb(color, t=0.2),
                        line=dict(color="rgba(255, 255, 255, 0)"),
                        hoverinfo="skip",
                        showlegend=False,
                    )
                ]
            fig.add_traces(_line + _error)
        self.update_layout(fig, title, x_label, y_label)
        return fig
    def plot_diagonal(
        self,
        reference,
        columns,
        data,
        *,
        pos_class=1,
        title="default",
        x_label="true",
        y_label="estim.",
        fixed_lim=False,
        legend=True,
    ) -> go.Figure:
        fig = go.Figure()
        x = reference
        line_colors = self.get_colors(len(columns))
        if fixed_lim:
            _lims = np.array([[0.0, 1.0], [0.0, 1.0]])
        else:
    _edges = (
-                np.min([np.min(x), np.min(data)]),
+        np.min([np.min(true_accs), np.min(estim_accs)]),
-                np.max([np.max(x), np.max(data)]),
+        np.max([np.max(true_accs), np.max(estim_accs)]),
    )
    _lims = np.array([[_edges[0], _edges[1]], [_edges[0], _edges[1]]])
-        named_data = {c: d for c, d in zip(columns, data)}
+
-        r_columns = {c: r for c, r in zip(columns, self.rename_plots(columns))}
+def plot_diagonal(
-        columns = np.array(CE.name.sort(columns))
+    method_names,
-        for name in columns:
+    true_accs,
-            val = named_data[name]
+    estim_accs,
-            r_name = r_columns[name]
+    *,
    measure_name="vanilla_accuracy",
    dataset_name=None,
    basedir=None,
 ) -> go.Figure:
    fig = go.Figure()
    x = true_accs
    line_colors = _get_colors(len(method_names))
    _lims = _get_ref_limits(true_accs, estim_accs)
    for name, estim in zip(method_names, estim_accs):
        color = next(line_colors)
-            slope, interc = np.polyfit(x, val, 1)
+        slope, interc = np.polyfit(x, estim, 1)
            # y_lr = np.array([slope * _x + interc for _x in _lims[0]])
        fig.add_traces(
            [
                go.Scatter(
                    x=x,
-                        y=val,
+                    y=estim,
-                        customdata=np.stack((val - x,), axis=-1),
+                    customdata=np.stack((estim - x,), axis=-1),
                    mode="markers",
-                        name=r_name,
+                    name=name,
-                        marker=dict(color=self.hex_to_rgb(color, t=0.5)),
+                    marker=dict(color=_hex_to_rgb(color, t=0.5)),
                    hovertemplate="true acc: %{x:,.4f}<br>estim. acc: %{y:,.4f}<br>acc err.: %{customdata[0]:,.4f}",
                        # showlegend=False,
                ),
                    # go.Scatter(
                    #     x=[x[-1]],
                    #     y=[val[-1]],
                    #     mode="markers",
                    #     marker=dict(color=self.hex_to_rgb(color), size=8),
                    #     name=r_name,
                    # ),
                    # go.Scatter(
                    #     x=_lims[0],
                    #     y=y_lr,
                    #     mode="lines",
                    #     name=name,
                    #     line=dict(color=self.hex_to_rgb(color), width=3),
                    #     showlegend=False,
                    # ),
            ]
        )
    fig.add_trace(
@ -245,12 +105,14 @@ class PlotlyPlot(BasePlot):
            mode="lines",
            name="reference",
            showlegend=False,
-                line=dict(color=self.hex_to_rgb("#000000"), dash="dash"),
+            line=dict(color=_hex_to_rgb("#000000"), dash="dash"),
        )
    )
-        self.update_layout(fig, title, x_label, y_label)
+    _update_layout(
-        fig.update_layout(
+        fig,
        x_label=f"True {measure_name}",
        y_label=f"Estimated {measure_name}",
        autosize=False,
        width=1300,
        height=1000,
@ -258,73 +120,98 @@ class PlotlyPlot(BasePlot):
        yaxis_scaleratio=1.0,
        yaxis_range=[-0.1, 1.1],
    )
-        return fig
+    return _save_or_return(fig, basedir, dataset_name, measure_name, "diagonal")
-    def plot_shift(
+
-        self,
+def plot_delta(
-        shift_prevs,
+    method_names: list[str],
-        columns,
+    prevs: np.ndarray,
-        data,
+    acc_errs: np.ndarray,
    *,
-        counts=None,
+    stdevs: np.ndarray | None = None,
-        pos_class=1,
+    prev_name="Test",
-        title="default",
+    measure_name="Vanilla Accuracy",
-        x_label="true",
+    dataset_name=None,
-        y_label="estim.",
+    basedir=None,
-        legend=True,
+) -> go.Figure:
    ) -> go.Figure:
    fig = go.Figure()
-        # x = shift_prevs[:, pos_class]
+    x = [str(bp) for bp in prevs]
-        x = shift_prevs
+    line_colors = _get_colors(len(method_names))
-        line_colors = self.get_colors(len(columns))
+    if stdevs is None:
-        named_data = {c: d for c, d in zip(columns, data)}
+        stdevs = [None] * len(method_names)
-        r_columns = {c: r for c, r in zip(columns, self.rename_plots(columns))}
+    for name, delta, stdev in zip(method_names, acc_errs, stdevs):
-        columns = np.array(CE.name.sort(columns))
+        color = next(line_colors)
-        for name in columns:
+        _line = [
-            delta = named_data[name]
+            go.Scatter(
-            r_name = r_columns[name]
+                x=x,
-            col_idx = (columns == name).nonzero()[0][0]
+                y=delta,
                mode=MODE,
                name=name,
                line=dict(color=_hex_to_rgb(color), width=L_WIDTH),
                hovertemplate="prev.: %{x}<br>error: %{y:,.4f}",
            )
        ]
        _error = []
        if stdev is not None:
            _error = [
                go.Scatter(
                    x=np.concatenate([x, x[::-1]]),
                    y=np.concatenate([delta - stdev, (delta + stdev)[::-1]]),
                    name=name,
                    fill="toself",
                    fillcolor=_hex_to_rgb(color, t=0.2),
                    line=dict(color="rgba(255, 255, 255, 0)"),
                    hoverinfo="skip",
                    showlegend=False,
                )
            ]
        fig.add_traces(_line + _error)
    _update_layout(
        fig,
        x_label=f"{prev_name} Prevalence",
        y_label=f"Prediction Error for {measure_name}",
    )
    return _save_or_return(
        fig, basedir, dataset_name, measure_name, "delta" if stdevs is None else "stdev"
    )
 def plot_shift(
    method_names: list[str],
    prevs: np.ndarray,
    acc_errs: np.ndarray,
    *,
    counts: np.ndarray | None = None,
    measure_name="Vanilla Accuracy",
    dataset_name=None,
    basedir=None,
 ) -> go.Figure:
    fig = go.Figure()
    x = prevs
    line_colors = _get_colors(len(method_names))
    if counts is None:
        counts = [None] * len(method_names)
    for name, delta, count in zip(method_names, acc_errs, counts):
        color = next(line_colors)
        fig.add_trace(
            go.Scatter(
                x=x,
                y=delta,
-                    customdata=np.stack((counts[col_idx],), axis=-1),
+                customdata=np.stack((count,), axis=-1),
-                    mode=_cfg.mode,
+                mode=MODE,
-                    name=r_name,
+                name=name,
-                    line=dict(color=self.hex_to_rgb(color), width=_cfg.lwidth),
+                line=dict(color=_hex_to_rgb(color), width=L_WIDTH),
                hovertemplate="shift: %{x}<br>error: %{y}"
                + "<br>count: %{customdata[0]}"
-                    if counts is not None
+                if count is not None
                else "",
            )
        )
-        self.update_layout(fig, title, x_label, y_label)
+    _update_layout(
-        return fig
+        fig,
-
+        x_label="Amount of Prior Probability Shift",
-    def plot_fit_scores(
+        y_label=f"Prediction Error for {measure_name}",
        self,
        train_prevs,
        scores,
        *,
        pos_class=1,
        title="default",
        x_label="prev.",
        y_label="position",
        legend=True,
    ) -> go.Figure:
        fig = go.Figure()
        # x = train_prevs
        x = [str(tuple(bp)) for bp in train_prevs]
        fig.add_trace(
            go.Scatter(
                x=x,
                y=scores,
                mode="lines+markers",
                showlegend=False,
            ),
    )
-
+    return _save_or_return(fig, basedir, dataset_name, measure_name, "shift")
        self.update_layout(fig, title, x_label, y_label)
        return fig