arviz-devs · aloctavodia · Jan 26, 2025 · Nov 15, 2024 · Nov 18, 2024 · Nov 18, 2024
diff --git a/docs/source/gallery/inference_diagnostics/plot_convergence_dist.py b/docs/source/gallery/inference_diagnostics/plot_convergence_dist.py
@@ -0,0 +1,25 @@
+"""
+# Convergence diagnostics distribution plot
+
+Plot the distribution of ESS and R-hat.
+
+---
+
+:::{seealso}
+API Documentation: {func}`~arviz_plots.plot_convergence_dist`
+:::
+"""
+
+from arviz_base import load_arviz_data
+
+import arviz_plots as azp
+
+azp.style.use("arviz-clean")
+
+data = load_arviz_data("radon")
+pc = azp.plot_convergence_dist(
+    data,
+    var_names=["za_county"],
+    backend="none",  # change to preferred backend
+)
+
+pc.show()
diff --git a/src/arviz_plots/plots/__init__.py b/src/arviz_plots/plots/__init__.py
@@ -1,6 +1,7 @@
 """Batteries-included ArviZ plots."""
 
 from .compareplot import plot_compare
+from .convergencedistplot import plot_convergence_dist
 from .distplot import plot_dist
 from .energyplot import plot_energy
 from .essplot import plot_ess
@@ -13,6 +14,7 @@
 
 __all__ = [
     "plot_compare",
+    "plot_convergence_dist",
     "plot_dist",
     "plot_forest",
     "plot_trace",

diff --git a/src/arviz_plots/plots/convergencedistplot.py b/src/arviz_plots/plots/convergencedistplot.py
@@ -0,0 +1,202 @@
+"""Convergence diagnostic distribution plot code."""
+import warnings
+
+from arviz_base import convert_to_dataset, rcParams
+
+from arviz_plots.plots.distplot import plot_dist
+from arviz_plots.plots.utils import process_group_variables_coords
+
+
+def plot_convergence_dist(
+    dt,
+    diagnostics=None,
+    ref_line=True,
+    var_names=None,
+    filter_vars=None,
+    group="posterior",
+    coords=None,
+    sample_dims=None,
+    kind="ecdf",
+    point_estimate=None,
+    ci_kind=None,
+    ci_prob=None,
+    plot_collection=None,
+    backend=None,
+    labeller=None,
+    aes_map=None,
+    plot_kwargs=None,
+    stats_kwargs=None,
+    pc_kwargs=None,
+):
+    """Plot the distribution of convergence diagnostics (ESS and/or R-hat).
+
+    Each requested diagnostic is computed for the selected variables, the values are
+    pooled into a single distribution per diagnostic and drawn with
+    :func:`~arviz_plots.plot_dist`.
+
+    Parameters
+    ----------
+    dt : DataTree
+        Input data
+    diagnostics : list of str
+        List of diagnostics to plot. Defaults to ["ess_bulk", "ess_tail", "rhat_rank"].
+        Valid diagnostics are "rhat_rank", "rhat_folded", "rhat_z_scale", "rhat_split",
+        "rhat_identity", "ess_bulk", "ess_tail", "ess_mean", "ess_sd", "ess_quantile",
+        "ess_local", "ess_median", "ess_mad", "ess_z_scale", "ess_folded" and "ess_identity".
+        "ess_tail", "ess_local" and "ess_quantile" accept probabilities in parentheses,
+        e.g. "ess_tail(0.1, 0.9)" or "ess_quantile(0.9)".
+    ref_line : bool
+        Whether to plot a reference line for the recommended value of each diagnostic.
+        Defaults to True.
+    var_names : str or list of str, optional
+        One or more variables to be plotted.
+        Prefix the variables by ~ when you want to exclude them from the plot.
+    filter_vars : {None, "like", "regex"}, optional, default=None
+        If None (default), interpret var_names as the real variables names.
+        If "like", interpret var_names as substrings of the real variables names.
+        If "regex", interpret var_names as regular expressions on the real variables names.
+    group : str, default "posterior"
+        Group of `dt` from which the variables are taken.
+    coords : dict, optional
+        Coordinates used to subset the variables before computing the diagnostics.
+    sample_dims : str or sequence of hashable, optional
+        Dimensions to reduce unless mapped to an aesthetic.
+        Defaults to ``rcParams["data.sample_dims"]``
+    kind : {"kde", "hist", "dot", "ecdf"}, optional
+        How to represent the distribution of diagnostics. Defaults to "ecdf".
+    point_estimate, ci_kind, ci_prob : optional
+        Forwarded unchanged to :func:`~arviz_plots.plot_dist`. Note that the
+        "credible_interval", "point_estimate" and "point_estimate_text" entries of
+        `plot_kwargs` default to ``False`` in this function.
+    plot_collection : PlotCollection, optional
+    backend : {"matplotlib", "bokeh", "plotly"}, optional
+    labeller : labeller, optional
+    aes_map : mapping of {str : sequence of str}, optional
+        Mapping of artists to aesthetics that should use their mapping in `plot_collection`
+        when plotted. Valid keys are the same as for `plot_kwargs`.
+
+    plot_kwargs : mapping of {str : mapping or False}, optional
+        Valid keys are:
+
+        * One of "kde", "ecdf", "dot" or "hist", matching the `kind` argument.
+
+          * "kde" -> passed to :func:`~arviz_plots.visuals.line_xy`
+          * "ecdf" -> passed to :func:`~arviz_plots.visuals.ecdf_line`
+          * "hist" -> passed to :func:`~arviz_plots.visuals.hist`
+
+        * ref_line -> passed to the ``axvline`` method of each diagnostic's plot.
+          Defaults to a dashed, semi-transparent black line. Use ``False`` to skip
+          drawing the reference lines.
+        * title -> passed to :func:`~arviz_plots.visuals.labelled_title`
+        * remove_axis -> not passed anywhere, can only be ``False`` to skip calling this function
+
+    stats_kwargs : mapping, optional
+        Valid keys are:
+
+        * density -> passed to kde, ecdf, ...
+
+    pc_kwargs : mapping
+        Passed to :meth:`arviz_plots.PlotCollection.wrap`
+
+    Returns
+    -------
+    PlotCollection
+
+    Examples
+    --------
+    Select a single variable and specify diagnostics
+
+    .. plot::
+        :context: close-figs
+
+        >>> from arviz_plots import plot_convergence_dist, style
+        >>> style.use("arviz-clean")
+        >>> from arviz_base import load_arviz_data
+        >>> radon = load_arviz_data('radon')
+        >>> plot_convergence_dist(
+        ...     radon, var_names=["za_county"], diagnostics=["rhat_rank", "ess_tail"]
+        ... )
+
+    Some ESS methods accept a probability argument
+
+    .. plot::
+        :context: close-figs
+
+        >>> plot_convergence_dist(
+        ...     radon,
+        ...     var_names=["za_county"],
+        ...     diagnostics=["ess_tail(0.1, 0.9)", "ess_local(0.1, 0.9)", "ess_quantile(0.9)"],
+        ... )
+
+
+    .. minigallery:: plot_convergence_dist
+
+    """
+    if sample_dims is None:
+        sample_dims = rcParams["data.sample_dims"]
+    if isinstance(sample_dims, str):
+        sample_dims = [sample_dims]
+    sample_dims = list(sample_dims)
+    # Work on shallow copies so the caller's mappings are never modified.
+    if plot_kwargs is None:
+        plot_kwargs = {}
+    else:
+        plot_kwargs = plot_kwargs.copy()
+    if pc_kwargs is None:
+        pc_kwargs = {}
+    else:
+        pc_kwargs = pc_kwargs.copy()
+
+    if diagnostics is None:
+        diagnostics = ["ess_bulk", "ess_tail", "rhat_rank"]
+
+    # The reference line is drawn by this function, not by plot_dist, so its kwargs are
+    # taken out of plot_kwargs before forwarding. A new dict is built for the defaults so
+    # the nested mapping supplied by the caller is left untouched.
+    ref_line_kwargs = plot_kwargs.pop("ref_line", None)
+    if ref_line_kwargs is None:
+        ref_line_kwargs = {}
+    if ref_line_kwargs is not False:
+        ref_line_kwargs = {"color": "k", "linestyle": "--", "alpha": 0.5, **ref_line_kwargs}
+
+    dt = process_group_variables_coords(
+        dt, group=group, var_names=var_names, filter_vars=filter_vars, coords=coords
+    )
+
+    new_ds = _get_diagnostics(dt, diagnostics)
+
+    # Interval and point-estimate artists are off unless the caller asks for them.
+    plot_kwargs.setdefault("credible_interval", False)
+    plot_kwargs.setdefault("point_estimate", False)
+    plot_kwargs.setdefault("point_estimate_text", False)
+
+    # new_ds already holds the selected data, so no further group/variable/coordinate
+    # selection is requested from plot_dist.
+    plot_collection = plot_dist(
+        new_ds,
+        var_names=None,
+        filter_vars=None,
+        group=None,
+        coords=None,
+        sample_dims=sample_dims,
+        kind=kind,
+        point_estimate=point_estimate,
+        ci_kind=ci_kind,
+        ci_prob=ci_prob,
+        plot_collection=plot_collection,
+        backend=backend,
+        labeller=labeller,
+        aes_map=aes_map,
+        plot_kwargs=plot_kwargs,
+        stats_kwargs=stats_kwargs,
+        pc_kwargs=pc_kwargs,
+    )
+
+    if ref_line and ref_line_kwargs is not False:
+        ess_ref = dt.sizes["chain"] * 100
+        # NOTE(review): is this valid for all r_hat methods? Do we want to correct for
+        # multiple comparisons?
+        r_hat_ref = 1.01
+        for diagnostic in diagnostics:
+            # Same precedence as _get_diagnostics: ESS is checked first, then R-hat.
+            if "ess" in diagnostic:
+                ref = ess_ref
+            elif "rhat" in diagnostic:
+                ref = r_hat_ref
+            else:
+                # Unrecognized diagnostics are not computed, so there is no plot
+                # (and no recommended value) to annotate.
+                continue
+            # NOTE(review): calling ``axvline`` on the plot object looks specific to
+            # matplotlib-like backends - confirm behaviour for the other backends.
+            plot_collection.viz[diagnostic]["plot"].item().axvline(ref, **ref_line_kwargs)
+
+    return plot_collection
+
+
+def _get_diagnostics(dt, diagnostics):
+    """Compute the requested convergence diagnostics and collect them in a dataset.
+
+    Parameters
+    ----------
+    dt : object exposing the ``azstats`` accessor
+        Data for which ``dt.azstats.ess`` and ``dt.azstats.rhat`` are evaluated.
+    diagnostics : iterable of str
+        Names of the form ``"ess_<method>"`` or ``"rhat_<method>"``. ESS methods
+        "tail", "quantile" and "local" may carry probabilities in parentheses,
+        e.g. ``"ess_tail(0.1, 0.9)"``. A bare ``"ess"`` or ``"rhat"`` leaves the
+        method unspecified so the default of the stats function applies.
+
+    Returns
+    -------
+    Dataset
+        Result of ``convert_to_dataset`` with one variable per recognized diagnostic,
+        keyed by the diagnostic string exactly as given. The values of all input
+        variables are flattened into a single row of shape ``(1, n)``.
+
+    Warns
+    -----
+    UserWarning
+        For every diagnostic that contains neither "ess" nor "rhat"; such entries
+        are skipped.
+    """
+    diagnostic_values = {}
+    for diagnostic in diagnostics:
+        # "ess_tail(0.1, 0.9)" -> name "ess_tail", args "0.1, 0.9)"
+        name, _, args = diagnostic.partition("(")
+        # "ess_tail" -> "tail"; empty string when there is no "_<method>" suffix
+        method = name.partition("_")[2].strip()
+        # Only pass ``method`` when one was given, so a bare "ess"/"rhat" does not fail.
+        kwargs = {"method": method} if method else {}
+
+        if "ess" in diagnostic:
+            prob = None
+            if method in {"tail", "quantile", "local"} and args:
+                # float() ignores surrounding whitespace, so "0.1,0.9" and "0.1, 0.9"
+                # are both accepted.
+                prob = [float(p) for p in args.strip().rstrip(")").split(",")]
+            result = dt.azstats.ess(prob=prob, **kwargs)
+        elif "rhat" in diagnostic:
+            result = dt.azstats.rhat(**kwargs)
+        else:
+            warnings.warn(f"{diagnostic} is not recognized as a valid diagnostic")
+            continue
+
+        # Pool every variable/coordinate into one row; presumably the leading axis of
+        # length 1 is read as a single chain by convert_to_dataset - TODO confirm.
+        diagnostic_values[diagnostic] = result.to_array().values.reshape(1, -1)
+    return convert_to_dataset(diagnostic_values)