# Source code for multipac_testbench.util.plot

"""Define helper functions for plots."""

import itertools
import logging
import re
from abc import ABCMeta
from collections.abc import Collection, Iterable, Sequence
from pathlib import Path
from typing import Any, TypeVar, cast

import matplotlib
import matplotlib.cm as cm
import matplotlib.colors as mcolors
import matplotlib.pyplot as plt
import numpy as np
import pandas as pd
from matplotlib.axes import Axes
from matplotlib.figure import Figure
from matplotlib.typing import ColorType
from multipac_testbench.instruments.instrument import Instrument
from multipac_testbench.multipactor_test.loader import save
from multipac_testbench.threshold.threshold import PowerExtremum
from multipac_testbench.threshold.threshold_set import ThresholdSet
from multipac_testbench.util.helper import drop_repeated_col, is_nested_list
from multipac_testbench.util.multipactor_detectors import (
    start_and_end_of_contiguous_true_zones,
)
from numpy.typing import NDArray

# Generic type of the attributes handled by ``attribute_to_color``; restricted
# to ``float`` and its subclasses through ``bound``.
T = TypeVar("T", bound=float)



[docs]
def plot_susceptibility_with_grad(
    df: pd.DataFrame,
    zcol: str,
    ax: Axes | None = None,
    xlim: tuple[float, float] | None = None,
    ylim: tuple[float, float] | None = None,
    ylabel: str | None = None,
    cmap: mcolors.Colormap | None = None,
    s: int = 5,
    **kwargs,
) -> Axes:
    """Scatter ``lower``/``upper`` columns of ``df``, coloured by ``zcol``.

    Rows where ``zcol`` is NaN are dropped (a warning is logged). Both axes
    are set to a logarithmic scale and a colorbar labelled ``zcol`` is added
    to the figure.

    Parameters
    ----------
    df :
        Data to plot. Its index is used as x data; every column whose name
        contains ``"lower"`` or ``"upper"`` is drawn.
    zcol :
        Name of the column in ``df`` providing the marker colours.
    ax :
        Axis to draw on. A new figure is created when not provided.
    xlim, ylim :
        Plot limits.
    ylabel :
        Label for the y-axis; left untouched when empty or None.
    cmap :
        Colour map; ``"viridis"`` is used when not provided.
    s :
        Marker size.
    kwargs :
        Other keyword arguments passed to ``Axes.scatter``. They take
        precedence over the defaults built here (``norm``, ``cmap``, ``c``,
        ``x``, ``s``).

    Returns
    -------
        The axis holding the plot.

    """
    if ax is None:
        ax = plt.subplots()[1]

    n_dropped = df[zcol].isna().sum()
    if n_dropped:
        logging.warning(f"Dropped {n_dropped} rows with NaN in {zcol} column.")
        df = df.dropna(subset=[zcol])
    color_values = df[zcol].to_numpy()

    defaults = {
        "norm": mcolors.Normalize(
            vmin=color_values.min(), vmax=color_values.max()
        ),
        "cmap": cmap if cmap else matplotlib.colormaps.get_cmap("viridis"),
        "c": color_values,
        "x": df.index,
        "s": s,
    }
    scatter_kwargs = {**defaults, **kwargs}

    # Lower thresholds are drawn first (circles), then upper ones (stars).
    for pattern, marker in (("lower", "o"), ("upper", "*")):
        for col in df.filter(like=pattern):
            ax.scatter(y=df[col], marker=marker, label=col, **scatter_kwargs)

    # Stand-alone mappable, so that the colorbar follows the norm/cmap that
    # were effectively used (user may have overridden them through kwargs).
    mappable = cm.ScalarMappable(
        norm=scatter_kwargs["norm"], cmap=scatter_kwargs["cmap"]
    )
    mappable.set_array([])
    ax.figure.colorbar(mappable, ax=ax, label=zcol)

    if ylabel:
        ax.set_ylabel(ylabel)
    ax.legend()
    ax.grid(True)
    ax.set(xscale="log", yscale="log", xlim=xlim, ylim=ylim)
    return ax




[docs]
def plot_susceptibility_without_grad(
    df: pd.DataFrame,
    label_to_color: dict[str, ColorType],
    ax: Axes | None = None,
    xlim: tuple[float, float] | None = None,
    ylim: tuple[float, float] | None = None,
    ylabel: str | None = None,
    s: int = 5,
    **kwargs,
) -> Axes:
    """Scatter ``lower``/``upper`` columns of ``df`` with one color per column.

    Both axes are set to a logarithmic scale.

    Parameters
    ----------
    df :
        Data to plot. Its index is used as x data; every column whose name
        contains ``"lower"`` or ``"upper"`` is drawn.
    label_to_color :
        Color to use for every plotted column; keys are ``str(column)``.
    ax :
        Axis to draw on. A new figure is created when not provided.
    xlim, ylim :
        Plot limits.
    ylabel :
        Label for the y-axis; left untouched when empty or None.
    s :
        Marker size.
    kwargs :
        Other keyword arguments passed to ``Axes.scatter``. They take
        precedence over the default ``x`` and ``s``.

    Returns
    -------
        The axis holding the plot.

    """
    if ax is None:
        ax = plt.subplots()[1]

    scatter_kwargs = {"x": df.index, "s": s}
    scatter_kwargs.update(kwargs)

    # Lower thresholds are drawn first (circles), then upper ones (stars).
    for pattern, marker in (("lower", "o"), ("upper", "*")):
        for col in df.filter(like=pattern):
            ax.scatter(
                y=df[col],
                marker=marker,
                label=col,
                c=label_to_color[str(col)],
                **scatter_kwargs,
            )

    if ylabel:
        ax.set_ylabel(ylabel)
    ax.legend()
    ax.grid(True)
    ax.set(xscale="log", yscale="log", xlim=xlim, ylim=ylim)
    return ax




[docs]
def attribute_to_color(
    attributes: Iterable[T],
) -> dict[T, tuple[float, float, float]]:
    """Associate every attribute with a color of the current color cycle.

    Attributes are sorted, then colors from matplotlib's
    ``axes.prop_cycle`` are assigned in order, wrapping around when there are
    more attributes than colors.

    Used for example by :meth:`.TestCampaign.check_somersalo_scaling_law`, to
    always keep the same plot color for a given frequency.

    Parameters
    ----------
    attributes :
        Sortable values to which a color must be associated.

    Returns
    -------
        Maps every attribute to the ``"color"`` entry of the property cycle.

    """
    palette = [entry["color"] for entry in plt.rcParams["axes.prop_cycle"]]

    attr_to_color = {}
    for rank, attribute in enumerate(sorted(attributes)):
        attr_to_color[attribute] = palette[rank % len(palette)]
    return attr_to_color




[docs]
def plot_extrema_markers(
    ax_by_position: dict[float, Axes] | Axes,
    instruments: list[Instrument],
    extrema: list[PowerExtremum],
    marker_style: dict[str, dict] | None = None,
    zorder: int = 3,
) -> None:
    """Mark the value of every instrument at every power extremum.

    .. todo::
        Fill above/below the extrema.

    Parameters
    ----------
    ax_by_position :
        Either a single Axes used for all instruments, or a dict mapping
        instrument position to the Axes to draw on.
    instruments :
        Instruments from which values are taken; their ``data``,
        ``position`` and ``color`` attributes are used.
    extrema :
        Power extrema; their ``sample_index`` and ``nature`` attributes are
        used.
    marker_style :
        Maps the nature of an extremum (``"minimum"``, ``"maximum"``) to
        keyword arguments for ``Axes.plot``. A nature missing from the dict
        gets no specific style. Defaults to downward/upward triangles.
    zorder :
        Layer order of the markers.

    """
    one_axes_per_position = isinstance(ax_by_position, dict)

    if not marker_style:
        marker_style = {
            "minimum": dict(marker="v", linestyle="none", label="Minimum"),
            "maximum": dict(marker="^", linestyle="none", label="Maximum"),
        }

    for extremum in extrema:
        style = marker_style.get(extremum.nature, {})
        for instr in instruments:
            index = extremum.sample_index
            if index >= len(instr.data):
                # This instrument has no sample at the extremum
                continue
            value = instr.data[index]

            position = instr.position
            if one_axes_per_position:
                target = ax_by_position[position]
            else:
                target = ax_by_position  # same figure

            target.plot(
                index, value, color=instr.color, **style, zorder=zorder
            )




[docs]
def create_fig(
    title: str = "",
    instruments_to_plot: Sequence[ABCMeta] = (),
    xlabel: str | None = None,
    subplot_kw: dict | None = None,
    **fig_kw,
) -> tuple[Figure, dict[ABCMeta, Axes]]:
    """Create a figure holding one subplot per instrument class.

    Parameters
    ----------
    title :
        Figure title; nothing is set when it is empty.
    instruments_to_plot :
        Class of the instruments to be plotted; one row of subplot is created
        for each.
    xlabel :
        Label of the x-axis, forwarded to the axes creation.
    subplot_kw :
        Keyword arguments used for the creation of every subplot.
    fig_kw :
        Keyword arguments passed to ``plt.figure``.

    Returns
    -------

        Figure holding the axes.

        Dictionary linking the class of the instruments to plot with the
        associated axes.

    """
    figure = plt.figure(**fig_kw)

    axes_options = {} if subplot_kw is None else subplot_kw
    axes_by_class = _create_axes(
        instruments_to_plot,
        figure,
        len(instruments_to_plot),
        xlabel,
        **axes_options,
    )

    if len(title):
        figure.suptitle(title)
    return figure, axes_by_class




[docs]
def _create_axes(
    instruments_to_plot: Sequence[ABCMeta],
    fig: Figure,
    nrows: int,
    xlabel: str | None = None,
    **subplot_kw,
) -> dict[ABCMeta, Axes]:
    """Create vertically stacked axes, one per instrument class.

    Parameters
    ----------
    instruments_to_plot :
        Class of the instruments to be plotted. If a class exposes a
        ``ylabel`` callable, its return value labels the y-axis; otherwise
        ``"default"`` is used.
    fig :
        Figure in which subplots are added.
    nrows :
        Number of subplots to create, in a single column.
    xlabel :
        If given, label of the x-axis of the bottom subplot.
    subplot_kw :
        Keyword arguments passed to ``Figure.add_subplot``.

    Returns
    -------
        Dictionary linking the class of the instruments to plot with the
        associated axes. Classes and axes are paired in order; extra items on
        either side are ignored.

    """
    axes: list[Axes] = []
    for row in range(nrows):
        # Every subplot but the first shares its x-axis with the first one
        sharex = axes[0] if axes else None
        axes.append(
            fig.add_subplot(nrows, 1, row + 1, sharex=sharex, **subplot_kw)
        )

    # ``axes`` is empty when ``nrows == 0``: there is nothing to label then,
    # and ``axes[-1]`` would raise an IndexError.
    if xlabel is not None and axes:
        axes[-1].set_xlabel(xlabel)

    instrument_class_axes = dict(zip(instruments_to_plot, axes))

    for instrument_class, axe in instrument_class_axes.items():
        axe.grid(True)
        ylabel = getattr(instrument_class, "ylabel", lambda: "default")()
        axe.set_ylabel(ylabel)
    return instrument_class_axes




[docs]
def finish_fig(
    fig: Figure,
    axes: Iterable[Axes],
    png_path: Path | None = None,
) -> tuple[Figure, list[Axes]]:
    """Add a legend to every axes and optionally save the figure.

    Parameters
    ----------
    fig :
        Figure to finalize.
    axes :
        Axes on which a legend is created.
    png_path :
        Where the figure is saved. Nothing is saved when it is None.

    Returns
    -------

        The figure that was given.

        The axes, gathered in a list.

    """
    # Materialize once: ``axes`` may be a one-shot iterable and is returned
    axes = list(axes)
    for axe in axes:
        axe.legend()

    if png_path is not None:
        fig.savefig(png_path)

    return fig, axes




[docs]
def create_df_to_plot(
    data_to_plot: Sequence[pd.Series | pd.DataFrame],
    head: int | None = None,
    tail: int | None = None,
    column_names: str | list[str] = "",
    drop_repeated_x: bool = False,
    **kwargs,
) -> pd.DataFrame:
    """Merge the series into a single dataframe.

    Parameters
    ----------
    data_to_plot :
        List of the data that will be plotted.
    head :
        Plot only the first ``head`` rows.
    tail :
        Plot only the last ``tail`` rows.
    column_names :
        To override the default column names. This is used in particular with
        the method :meth:`.TestCampaign.sweet_plot` when
        ``all_on_same_plot=True``.
    drop_repeated_x :
        If True, remove consecutive rows with identical x values.
    kwargs :
        Other keyword arguments.

    Returns
    -------
        Contains x and y data that will be plotted.

    """
    lengths = [len(item) for item in data_to_plot]
    if len(set(lengths)) > 1:
        logging.warning(
            f"Not all data sources have the same length: {lengths}"
        )
    df_to_plot = pd.concat(data_to_plot, axis=1)

    if head is not None:
        df_to_plot = df_to_plot.head(head)
    if tail is not None:
        df_to_plot = df_to_plot.tail(tail)

    # Remove duplicate columns
    df_to_plot = df_to_plot.loc[:, ~df_to_plot.columns.duplicated()].copy()

    if drop_repeated_x:
        df_to_plot = drop_repeated_col(df_to_plot)

    if not column_names:
        return df_to_plot

    if isinstance(column_names, str):
        column_names = [column_names]

    old_column_names = df_to_plot.columns.values
    assert len(column_names) == len(old_column_names)
    columns_mapper = {
        old: new for old, new in zip(old_column_names, column_names)
    }
    df_to_plot.rename(columns=columns_mapper, inplace=True)

    return df_to_plot




[docs]
def match_x_and_y_column_names(
    x_columns: list[str] | None,
    y_columns: list[list[str]] | list[list[list[str]]],
) -> tuple[list[str] | str | None, list[list[str]] | list[str]]:
    """Match name of x columns with y columns, remove duplicate columns.

    Parameters
    ----------
    x_columns :
        Name of the instrument(s) used as x-axis.
    y_columns :
        Name of the instruments for y-axis, sorted by subplot. It can be
        3-level nested list, in particular when we separate data between
        increasing and decreasing power values.

    Returns
    -------
        Name of the instrument(s) used as x-axis. Three possibilities:

        - If it is None, we plot again sample index.
        - If it is a single :class:`.Instrument` name, it will be used as
          x-data for every plot.
        - If it is a list of names, its length matches the length of
          ``y_columns``. This is typically what happens when we plot an
          instrument vs another.

        Name of the instruments for y-axis.

    """
    # One or several instrument types plotted vs Sample index
    if x_columns is None:
        # None, list[str]
        return x_columns, y_columns

    # One or several instruments types plotted vs another single instrument
    if len(x_columns) == 1:
        x_column = x_columns[0]

        for y_column in y_columns:
            if x_column in y_column:
                y_column.remove(x_column)
        # str, list[str] | list[list[str]]
        return x_column, y_column

    # One instrument type plotted vs another instrument type
    # number of instruments should match
    x_column = x_columns
    y_column = y_columns[0]
    assert len(x_column) == len(y_column)
    # list[str], list[list[str]]
    return x_column, y_column




[docs]
def actual_plot(
    df_to_plot: pd.DataFrame,
    x_columns: list[str] | str | None,
    y_columns: list[list[str]] | list[str],
    axes: list[Axes],
    grid: bool = True,
    sharex: bool | None = True,
    color: dict[str, str] | None = None,
    **kwargs,
) -> list[Axes]:
    """Plot the columns of ``df_to_plot`` on the given axes.

    Parameters
    ----------
    df_to_plot :
        Contains all the data that will be plotted.
    x_columns :
        Name of the column(s) used for x axis. When it is not a list, the
        same value is used for every entry of ``y_columns``.
    y_columns :
        Name of the column(s) for y plot. If ``list`` of ``list``, each sublist
        is a subplot.
    axes :
        Axes to plot on. When a single one is given, it is re-used for every
        entry of ``y_columns``.
    grid :
        If the grid should be plotted.
    sharex :
        To let the different subplots share the same x-axis. It is set to None
        when we re-use already existing Axes.
    color :
        Dictionary linking column names in ``df_to_plot`` to HTML colors. Used
        to keep the same color between different instruments at the same
        :class:`.PickUp`.
    kwargs :
        Other keyword arguments passed to ``DataFrame.plot``.

    Returns
    -------
        Axes that were plotted on, one per entry of ``y_columns``.

    Raises
    ------
    ValueError
        If x columns, y columns, axes and styles do not all have the same
        length (strict ``zip``). An error is logged beforehand when x and y
        lengths differ.

    """
    # One style mapping per entry of ``y_columns``.
    # NOTE(review): in the flat case a bare column name (a ``str``) is handed
    # to ``styles_from_column_cycle`` -- confirm this is intended.
    if is_nested_list(y_columns):
        styles = [
            styles_from_column_cycle(group)
            for group in cast(list[list[str]], y_columns)
        ]
    else:
        styles = [
            styles_from_column_cycle(name)
            for name in cast(list[str], y_columns)
        ]

    if not isinstance(x_columns, list):
        x_columns = [x_columns] * len(y_columns)

    assert isinstance(x_columns, list)

    if len(x_columns) != len(y_columns):
        logging.error(
            f"Mismatch between the length of {x_columns = } and {y_columns = }"
        )

    if len(axes) == 1:
        axes = [axes[0]] * len(y_columns)

    for x_name, y_entry, target, style_map in zip(
        x_columns, y_columns, axes, styles, strict=True
    ):
        y_names = y_entry if isinstance(y_entry, list) else [y_entry]

        # Solid line for every column without a dedicated style
        line_styles = []
        for name in y_names:
            column_style = style_map.get(name, {"linestyle": "-"})
            line_styles.append(column_style.get("linestyle", "-"))

        df_to_plot.plot(
            x=x_name,
            y=y_names,
            sharex=sharex,
            grid=grid,
            ax=target,
            color=color,
            style=line_styles,
            **kwargs,
        )
    return axes




[docs]
def set_labels(
    axes: Collection[Axes] | Axes,
    *ydata: ABCMeta,
    xdata: ABCMeta | None = None,
    xlabel: str = "",
    ylabel: str | Iterable = "",
    **kwargs,
) -> None:
    """Set the x and y labels of every subplot.

    Parameters
    ----------
    axes :
        Axes to label; a single Axes is also accepted.
    *ydata :
        Class of the plotted instruments.
    xdata :
        Class of the x-data instrument if applicable.
    xlabel :
        Label used for x axis. If not given, we take ``ylabel`` attribute
        from ``xdata``, or ``"Sample index"`` when ``xdata`` is not given
        either.
    ylabel :
        Labels that will be given for every subplot. If not given, we take
        the ``ylabel`` attribute of every plotted class. A label which is a
        2-tuple is shown on two lines, the first entry followed by an upward
        arrow and the second by a downward arrow.
    kwargs :
        Not used here.

    """
    if not xlabel:
        xlabel = "Sample index" if xdata is None else xdata.ylabel()

    if isinstance(axes, Axes):
        axes = (axes,)

    if not ylabel:
        # Kept lazy: labels are only computed for axes that actually exist
        ylabel = (instrument_class.ylabel() for instrument_class in ydata)
    if isinstance(ylabel, str):
        ylabel = (ylabel,)

    for ax, ylab in zip(axes, ylabel):
        is_directional = isinstance(ylab, tuple) and len(ylab) == 2
        if is_directional:
            # Directional labels: plot both with arrows
            text = f"{ylab[0]} (↑)\n{ylab[1]} (↓)"
        else:
            text = str(ylab)
        ax.set_ylabel(text)

        if xlabel:
            ax.set_xlabel(xlabel)




[docs]
def save_figure(
    axes: Axes | list[Axes],
    png_path: Path,
    verbose: bool = False,
    **png_kwargs,
) -> None:
    """Save the figure holding the given axes.

    Parameters
    ----------
    axes :
        One or several axes. When a list or an array is given, the figure of
        the first element is saved.
    png_path :
        Where figure shall be saved.
    verbose :
        To log a message indicating where Figure is saved.
    **png_kwargs :
        Keyword arguments for the ``Figure.savefig`` method.

    """
    is_collection = isinstance(axes, (np.ndarray, list))
    reference_axes = axes[0] if is_collection else axes

    fig = reference_axes.get_figure()
    assert isinstance(fig, Figure)
    fig.savefig(png_path, **png_kwargs)

    if not verbose:
        return
    logging.info(f"Figure saved @ {png_path = }")




[docs]
def save_dataframe(
    df_to_plot: pd.DataFrame,
    csv_path: Path,
    sep: str = ",",
    verbose: bool = False,
    **csv_kwargs,
) -> None:
    """Save the dataframe that was used to produce a plot.

    This is a thin wrapper around the project ``save`` function, called with
    ``info="plotted data"``.

    Parameters
    ----------
    df_to_plot :
        DataFrame to save.
    csv_path :
        Where to save DataFrame.
    sep :
        Column delimiter.
    verbose :
        Forwarded to ``save``; presumably toggles a message indicating where
        the DataFrame is saved.
    csv_kwargs :
        Other keyword arguments forwarded to ``save``; intended for the
        ``DataFrame.to_csv`` method.

    """
    save(
        csv_path, df_to_plot, info="plotted data", sep=sep, verbose=verbose,
        **csv_kwargs,
    )




[docs]
def add_background_color_according_to_power_growth(
    axe: Axes | Sequence[Axes] | NDArray[Axes],
    growth_mask: NDArray[np.bool],
    grow_kw: dict | None = None,
    decrease_kw: dict | None = None,
    legend: bool = True,
) -> None:
    """Color the background of the plot according to the power evolution.

    Parameters
    ----------
    axe :
        The Axes on which to plot. If a sequence or an array is given, this
        function is called on every element.
    growth_mask :
        A list containing True where power grows, False where decreases, np.nan
        when undetermined. Typical return value from
        :meth:`.ForwardPower.growth_mask`.
    grow_kw :
        How zones where power grows are colored. Default is a semi-transparent
        blue.
    decrease_kw :
        How zones where power decreases are colored. Default is a
        semi-transparent red.
    legend :
        If legend should be added.

    """
    if isinstance(axe, (Sequence, np.ndarray)):
        for single_axe in axe:
            add_background_color_according_to_power_growth(
                single_axe, growth_mask, grow_kw, decrease_kw, legend
            )
        return

    # ``np.array`` copies, so the mask given by the caller is not the object
    # handed to the helper. Note that the same copy is given to both calls.
    mask = np.array(growth_mask)
    grow_style = {"color": "b", "alpha": 0.2} if grow_kw is None else grow_kw
    decrease_style = (
        {"color": "r", "alpha": 0.2} if decrease_kw is None else decrease_kw
    )

    _add_single_bg_color(
        mask, axe, "Power grows", invert_array=False, **grow_style
    )
    _add_single_bg_color(
        mask, axe, "Power decreases", invert_array=True, **decrease_style
    )

    if legend:
        axe.legend()




[docs]
def _add_single_bg_color(
    growth_mask: NDArray[np.bool],
    axe: Axes,
    label: str | None,
    invert_array: bool,
    **color_kw: Any,
) -> None:
    """Add a single background color to the plot.

    ``growth_mask`` is left untouched: this function works on a copy, so the
    same mask can safely be given to several successive calls.

    Parameters
    ----------
    growth_mask :
        Array where 1. means power grows, 0. means it decreases, np.nan is
        undetermined.
    axe :
        Where color should be plotted.
    label :
        The label of the background color. It is given to the first colored
        zone only, so that it appears once in the legend.
    invert_array :
        Should be False for grow plot, True for decrease plot. Serve as a
        filling value for nan, so that undetermined samples are never
        colored.
    color_kw :
        Keyword arguments given to axvspan.

    """
    # Work on a copy. Filling the nan in the caller's array would turn them
    # into "power decreases" samples for a later call with
    # ``invert_array=True``.
    filled = np.array(growth_mask)
    filled[np.isnan(filled)] = invert_array

    data = filled.astype(np.bool_)
    if invert_array:
        data = ~data

    zones = start_and_end_of_contiguous_true_zones(data)
    for zone in zones:
        axe.axvspan(zone[0], zone[1], label=label, **color_kw)
        label = None




[docs]
def add_thresholds(
    threshold_set: ThresholdSet,
    axes: list[Axes] | Axes | None = None,
    scale: float = 1.0,
    alpha: float = 0.5,
    legend: bool = True,
    twinx: bool = False,
    **kwargs,
) -> Axes | list[Axes]:
    """Add the thresholds position to a pre-existing plot.

    .. warning::
        This function is not implemented anymore and always raises. The
        signature is kept so that existing calls fail with an explicit error.

    Raises
    ------
    NotImplementedError
        Always.

    """
    # The former body came after this statement and could never run; it also
    # relied on names that are not defined in this module.
    raise NotImplementedError("This is deprecated I think.")




[docs]
def plot_df_threshold(
    df: pd.DataFrame,
    ylabel: str,
    label_to_color: dict[str, tuple[float, float, float]],
    fig_title: str,
    xticks: Sequence[float],
    ms: int = 8,
    lw: float = 0.0,
    axes: Axes | None = None,
    plot_kwargs: dict[str, Any] | None = None,
    **kwargs,
) -> Axes:
    """Plot lower thresholds with circles, upper thresholds with stars.

    If no lower threshold is found, an error is logged and ``axes`` is
    returned as is; nothing is plotted, and ``axes`` must have been provided.
    If no upper threshold is found, only lower thresholds are plotted.

    Parameters
    ----------
    df :
        Holds ``"{Instrument.name} lower"`` and ``"{Instrument.name}
        upper"`` columns.
    ylabel :
        Y label.
    label_to_color :
        Maps threshold dataframe column names with a color.
    fig_title :
        Figure title.
    xticks :
        Position of xticks. A common choice is the position of power extrema.
    ms :
        Markers size.
    lw :
        Line width; the default of 0 shows the markers only.
    axes :
        To re-use pre-existing axis.
    plot_kwargs :
        Kwargs passed to the plotting function.
    kwargs :
        Not used here.

    Returns
    -------
        Axes holding the plot.

    """

    def _draw(thresholds: pd.DataFrame, marker: str, target: Axes | None):
        """Plot every column of ``thresholds`` with the given marker."""
        return thresholds.plot(
            marker=marker,
            ms=ms,
            grid=True,
            ylabel=ylabel,
            title=fig_title,
            color=[label_to_color[col] for col in thresholds.columns],
            ax=target,
            lw=lw,
            xticks=xticks,
            **(plot_kwargs or {}),
        )

    lower = df.filter(like="lower")
    if lower.empty:
        logging.error(f"No lower threshold to plot was found.\n{df}")
        assert (
            axes is not None
        ), "You must provide `axes` kwarg to continue execution anyway."
        return axes

    axes = _draw(lower, "o", axes)
    assert axes is not None
    # Restart the property cycle before plotting the upper thresholds
    axes.set_prop_cycle(None)

    upper = df.filter(like="upper")
    if not upper.empty:
        axes = _draw(upper, "*", axes)
        assert axes is not None
    return axes




[docs]
def _merge_legends(ax1: Axes, ax2: Axes) -> None:
    """Gather the legend entries of ``ax1`` and ``ax2`` in ``ax2`` legend.

    The legend of ``ax1`` is removed. In the merged legend, entries from
    ``ax1`` come before entries from ``ax2``.

    """
    first_handles, first_labels = ax1.get_legend_handles_labels()
    second_handles, second_labels = ax2.get_legend_handles_labels()

    ax1.legend().remove()
    ax2.legend(
        first_handles + second_handles,
        first_labels + second_labels,
    )




[docs]
def styles_from_column_cycle(
    columns: Iterable[str],
    linestyles: list[str] | None = None,
) -> dict[str, dict[str, str]]:
    """Assign line styles to columns based on their suffixes for plotting.

    Columns are expected to follow the naming convention produced by masking
    with suffixes, where each column name has the form
    ``"<base_name>__<suffix>"``. The part after the double underscore is used
    to distinguish the masked variants of the same base column.

    Line styles are cycled through for each unique suffix across columns
    sharing the same base name.

    Parameters
    ----------
    columns :
        The column names to assign styles to. Must follow the
        ``"<base_name>__<suffix>"`` convention.
    linestyles :
        The list of line styles to cycle through (e.g.,
        ``['-', '--', ':', '-.']``).

    Returns
    -------
        A dictionary mapping each column name to a dictionary with a
        ``"linestyle"`` key, e.g.,
        ``{'col__a': {'linestyle': '-'}, 'col__b': {'linestyle': '--'}}``.

    """

    if linestyles is None:
        linestyles = ["-", "--", "-.", ":"]

    base_to_columns: dict[str, list[str]] = {}
    for col in columns:
        base = re.split(r"__|\(|\[", col)[0]
        base_to_columns.setdefault(base, []).append(col)

    style_map = {}
    for base, cols in base_to_columns.items():
        cycle = itertools.cycle(linestyles)
        for col in sorted(cols):  # Sort for consistent ordering
            style_map[col] = {"linestyle": next(cycle)}

    return style_map




[docs]
def default_ylabel() -> str:
    """Give the placeholder text to use as y-label when none is defined."""
    placeholder = "???"
    return placeholder