Plotting

This module contains functions for plotting the results of the FACSIMILE procedure.

plotting

Functions:

plot_predictions –

Plot predicted scores against true scores.
plot_weights –

Plot a heatmap of a dataframe representing classifier weights.

plot_predictions

plot_predictions(true: ArrayLike, pred: ArrayLike, target_names: List[str] = None, scale: float = 1.0, fname: str = None, palette: List[str] = None, scatter_kws: Optional[Dict] = None, line_kws: Optional[Dict] = None, figure_kws: Optional[Dict] = None, ax: Axes = None)

Plot predicted scores against true scores.

Parameters:

true
(ArrayLike) –

True target variable scores.
pred
(ArrayLike) –

Predicted target variable scores.
target_names
(List[str], default: None ) –

List of target variable names. Defaults to None.
scale
(float, default: 1.0 ) –

Scale of the plot. Defaults to 1.0.
fname
(str, default: None ) –

Filename to save the plot to. Defaults to None.
palette
(List[str], default: None ) –

List of colours to use for each target. Defaults to None.
scatter_kws
(Optional[Dict], default: None ) –

Keyword arguments to pass to the scatter plot. Defaults to None.
line_kws
(Optional[Dict], default: None ) –

Keyword arguments to pass to the regression line. Defaults to None.
figure_kws
(Optional[Dict], default: None ) –

Keyword arguments to pass to the figure. Defaults to None.
ax
(Axes, default: None ) –

Axis to plot on. Defaults to None.

Source code in facsimile/plotting.py

def plot_predictions(
    true: ArrayLike,
    pred: ArrayLike,
    target_names: List[str] = None,
    scale: float = 1.0,
    fname: str = None,
    palette: List[str] = None,
    scatter_kws: Optional[Dict] = None,
    line_kws: Optional[Dict] = None,
    figure_kws: Optional[Dict] = None,
    ax: plt.Axes = None,
):
    """
    Plot predicted scores against true scores.

    One panel is drawn per target variable (column). Each panel contains a
    scatter of predicted against true values, a first-order least-squares
    fit line, a dashed line joining the lower-left and upper-right corners
    of the axis limits, and a title reporting the R^2 score.

    Args:
        true (ArrayLike): True target variable scores, one column per
            target. A 1-D input is treated as a single target.
        pred (ArrayLike): Predicted target variable scores, laid out like
            `true`.
        target_names (List[str], optional): List of target variable names.
            Defaults to `None`, in which case the panels are titled
            "Variable 1", "Variable 2", ...
        scale (float, optional): Scale of the plot. Only used to size the
            default figure. Defaults to `1.0`.
        fname (str, optional): Filename to save the plot to. Defaults to
            `None` (the figure is not saved).
        palette (List[str], optional): List of colours to use for each target.
            Colours are reused cyclically if there are more targets than
            colours. Defaults to `None` (matplotlib's colour cycle).
        scatter_kws (Optional[Dict], optional): Keyword arguments to pass to
            the scatter plot. Defaults to `None`.
        line_kws (Optional[Dict], optional): Keyword arguments to pass to the
            regression line. Defaults to `None`.
        figure_kws (Optional[Dict], optional): Keyword arguments to pass to the
            figure. Only used when `ax` is `None`. Defaults to `None`.
        ax (plt.Axes, optional): Axis to plot on. May be a single axis or a
            list / array holding one axis per target. Defaults to `None`
            (a new figure is created).

    Raises:
        AssertionError: If the number of target names or the number of
            supplied axes does not equal the number of targets.
    """

    # Convert to arrays *before* reading the shape so that plain lists and
    # dataframes are handled the same way
    true = np.asarray(true)
    pred = np.asarray(pred)

    # Treat 1-D input as a single target variable
    if true.ndim == 1:
        true = true.reshape(-1, 1)
    if pred.ndim == 1:
        pred = pred.reshape(-1, 1)

    # Get number of targets
    n_targets = true.shape[1]

    # Check target variable names are correct length
    if target_names is not None:
        assert (
            len(target_names) == n_targets
        ), "Number of target variable names must equal number of targets"
    else:
        target_names = [
            "Variable {}".format(i + 1) for i in range(n_targets)
        ]

    # Set default figure and line keyword arguments if not provided
    if figure_kws is None:
        figure_kws = dict(
            figsize=((n_targets * 3.333) * scale, 3.5 * scale),
            dpi=100,
            facecolor="white",
        )
    if line_kws is None:
        line_kws = {}
    if scatter_kws is None:
        scatter_kws = dict(
            alpha=0.2,
            s=0.5,
        )

    # Set up figure
    axes_supplied = ax is not None
    if not axes_supplied:
        _, ax = plt.subplots(
            1,
            n_targets,
            **figure_kws,
        )

    # Normalise a single axis, a list of axes or an array of axes to a flat
    # 1-D object array so that it can always be indexed per target
    ax = np.asarray(ax, dtype=object).ravel()

    if axes_supplied:
        # Make sure ax is the right length
        assert (
            len(ax) == n_targets
        ), "Number of axes must equal number of targets"

    # If no palette is provided, use matplotlib default
    if palette is None or len(palette) == 0:
        palette = [
            matplotlib.colors.to_hex(c)
            for c in plt.rcParams["axes.prop_cycle"].by_key()["color"]
        ]

    # Plot each target variable
    for i in range(n_targets):
        panel = ax[i]
        x = true[:, i]
        y = pred[:, i]

        # Wrap around so that more targets than colours does not fail
        colour = palette[i % len(palette)]

        panel.scatter(x=x, y=y, color=colour, **scatter_kws)
        panel.set_title(
            target_names[i]
            + "\n$R^2$ = {0}".format(np.round(r2_score(x, y), 3)),
        )

        # Add regression line, evaluated at the sorted unique true values
        x_unique = np.unique(x)
        fit = np.poly1d(np.polyfit(x, y, 1))
        panel.plot(
            x_unique,
            fit(x_unique),
            color=colour,
            **line_kws,
        )

        panel.set_xlabel("True score")
        panel.set_ylabel("Predicted score")

        # Set axis limits based on values
        panel.set_xlim([np.min(x), np.max(x)])
        panel.set_ylim([np.min(y), np.max(y)])

        # Dashed corner-to-corner reference line. Note that this coincides
        # with y = x only when true and predicted values span the same range.
        panel.plot(
            panel.get_xlim(), panel.get_ylim(), ls="--", color=colour
        )

    # Operate on the figure that owns the axes rather than on pyplot's
    # "current" figure, which may be a different one when `ax` is supplied
    fig = ax[0].figure
    fig.tight_layout()

    if fname is not None:
        fig.savefig(fname, dpi=300)

plot_weights

plot_weights(data: DataFrame, cmap: str = 'RdBu', colorbar_shrink: float = 1, colorbar_aspect: int = 5, figsize: tuple = None, vmin: float = None, vmax: float = None) -> None

Plot a heatmap of a dataframe representing classifier weights.

Parameters:

data
(DataFrame) –

The dataframe to plot.
cmap
(str, default: 'RdBu' ) –

The colormap to use for the heatmap. Defaults to 'RdBu'.
colorbar_shrink
(float, default: 1 ) –

The size of the colorbar. Defaults to 1.
colorbar_aspect
(int, default: 5 ) –

Aspect ratio of the colorbar. Defaults to 5.
figsize
(tuple, default: None ) –

Figure size as (width, height). If None, a default size is determined based on the shape of the dataframe. Defaults to None.
vmin
(float, default: None ) –

Minimum value for the colormap. Defaults to None.
vmax
(float, default: None ) –

Maximum value for the colormap. Defaults to None.

Source code in facsimile/plotting.py

def plot_weights(
    data: pd.DataFrame,
    cmap: str = "RdBu",
    colorbar_shrink: float = 1,
    colorbar_aspect: int = 5,
    figsize: tuple = None,
    vmin: float = None,
    vmax: float = None,
) -> None:
    """
    Plot a heatmap of a dataframe representing classifier weights.

    The dataframe is transposed before plotting, so its index labels end up
    on the x axis ("Items") and its column labels on the y axis ("Targets").
    A row labelled "Intercept" is removed first if one is present. The
    figure is displayed with `plt.show()`; nothing is returned.

    Args:
        data (pd.DataFrame): The dataframe to plot. It is not modified.
        cmap (str): The colormap to use for the heatmap. Defaults to 'RdBu'.
        colorbar_shrink (float): The size of the colorbar. Defaults to 1.
        colorbar_aspect (int): Aspect ratio of the colorbar. Defaults to 5.
        figsize (tuple): Figure size as (width, height). If None, a default
            size is determined based on the shape of the dataframe (one
            third of a unit per cell). Defaults to None.
        vmin (float): Minimum value for the colormap. Defaults to None.
        vmax (float): Maximum value for the colormap. Defaults to None.
    """

    # Drop the intercept row (if there is one) and transpose. `drop` returns
    # a new dataframe, so the caller's data is left untouched.
    data = data.drop("Intercept", axis=0, errors="ignore").T

    # Get values as numpy array
    values = data.values

    # Calculate figure size if not specified
    if figsize is None:
        figsize = (values.shape[1] / 3, values.shape[0] / 3)

    # Create figure with specified size
    fig, ax = plt.subplots(figsize=figsize)
    image = ax.matshow(values, cmap=cmap, vmin=vmin, vmax=vmax)

    # Add colorbar with shrink and aspect option
    fig.colorbar(
        image, shrink=colorbar_shrink, aspect=colorbar_aspect, label="Weight"
    )

    # Label every cell along both axes
    ax.set_xticks(np.arange(data.shape[1]))
    ax.set_yticks(np.arange(data.shape[0]))
    ax.set_xticklabels(data.columns)
    ax.set_yticklabels(data.index)

    # Set x and y labels on the heatmap axes explicitly, rather than on
    # whichever axes pyplot currently considers active
    ax.set_xlabel("Items")
    ax.set_ylabel("Targets")

    # Rotate x labels
    plt.setp(ax.get_xticklabels(), rotation=45, ha="left")

    plt.show()

Plotting

plotting

plot_predictions

`true`

`pred`

`target_names`

`scale`

`fname`

`palette`

`scatter_kws`

`line_kws`

`figure_kws`

`ax`

plot_weights

`data`

`cmap`

`colorbar_shrink`

`colorbar_aspect`

`figsize`

`vmin`

`vmax`