PyPI - arviz - Versions diffs - 0.16.1__py3-none-any.whl → 0.17.1__py3-none-any.whl - Mend

arviz 0.16.1__py3-none-any.whl → 0.17.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (60) hide show

arviz/__init__.py +1 -1
arviz/data/inference_data.py +34 -7
arviz/data/io_beanmachine.py +6 -1
arviz/data/io_cmdstanpy.py +439 -50
arviz/data/io_pyjags.py +5 -2
arviz/data/io_pystan.py +1 -2
arviz/labels.py +2 -0
arviz/plots/backends/bokeh/bpvplot.py +7 -2
arviz/plots/backends/bokeh/compareplot.py +7 -4
arviz/plots/backends/bokeh/densityplot.py +0 -1
arviz/plots/backends/bokeh/distplot.py +0 -2
arviz/plots/backends/bokeh/forestplot.py +3 -5
arviz/plots/backends/bokeh/kdeplot.py +0 -2
arviz/plots/backends/bokeh/pairplot.py +0 -4
arviz/plots/backends/matplotlib/bfplot.py +0 -1
arviz/plots/backends/matplotlib/bpvplot.py +3 -3
arviz/plots/backends/matplotlib/compareplot.py +1 -1
arviz/plots/backends/matplotlib/dotplot.py +1 -1
arviz/plots/backends/matplotlib/forestplot.py +2 -4
arviz/plots/backends/matplotlib/kdeplot.py +0 -1
arviz/plots/backends/matplotlib/khatplot.py +0 -1
arviz/plots/backends/matplotlib/lmplot.py +4 -5
arviz/plots/backends/matplotlib/pairplot.py +0 -1
arviz/plots/backends/matplotlib/ppcplot.py +8 -5
arviz/plots/backends/matplotlib/traceplot.py +1 -2
arviz/plots/bfplot.py +7 -6
arviz/plots/bpvplot.py +7 -2
arviz/plots/compareplot.py +2 -2
arviz/plots/ecdfplot.py +37 -112
arviz/plots/elpdplot.py +1 -1
arviz/plots/essplot.py +2 -2
arviz/plots/kdeplot.py +0 -1
arviz/plots/pairplot.py +1 -1
arviz/plots/plot_utils.py +0 -1
arviz/plots/ppcplot.py +51 -45
arviz/plots/separationplot.py +0 -1
arviz/stats/__init__.py +2 -0
arviz/stats/density_utils.py +2 -2
arviz/stats/diagnostics.py +2 -3
arviz/stats/ecdf_utils.py +165 -0
arviz/stats/stats.py +241 -38
arviz/stats/stats_utils.py +36 -7
arviz/tests/base_tests/test_data.py +73 -5
arviz/tests/base_tests/test_plots_bokeh.py +0 -1
arviz/tests/base_tests/test_plots_matplotlib.py +24 -1
arviz/tests/base_tests/test_stats.py +43 -1
arviz/tests/base_tests/test_stats_ecdf_utils.py +153 -0
arviz/tests/base_tests/test_stats_utils.py +3 -3
arviz/tests/external_tests/test_data_beanmachine.py +2 -0
arviz/tests/external_tests/test_data_numpyro.py +3 -3
arviz/tests/external_tests/test_data_pyjags.py +3 -1
arviz/tests/external_tests/test_data_pyro.py +3 -3
arviz/tests/helpers.py +8 -8
arviz/utils.py +15 -7
arviz/wrappers/wrap_pymc.py +1 -1
{arviz-0.16.1.dist-info → arviz-0.17.1.dist-info}/METADATA +16 -15
{arviz-0.16.1.dist-info → arviz-0.17.1.dist-info}/RECORD +60 -58
{arviz-0.16.1.dist-info → arviz-0.17.1.dist-info}/WHEEL +1 -1
{arviz-0.16.1.dist-info → arviz-0.17.1.dist-info}/LICENSE +0 -0
{arviz-0.16.1.dist-info → arviz-0.17.1.dist-info}/top_level.txt +0 -0

arviz/plots/backends/bokeh/compareplot.py CHANGED Viewed

@@ -69,13 +69,14 @@ def plot_compare(
             err_ys.append((y, y))
         # plot them
-        dif_tri = ax.triangle(
+        dif_tri = ax.scatter(
             comp_df[information_criterion].iloc[1:],
             yticks_pos[1::2],
             line_color=plot_kwargs.get("color_dse", "grey"),
             fill_color=plot_kwargs.get("color_dse", "grey"),
             line_width=2,
             size=6,
+            marker="triangle",
         )
         dif_line = ax.multi_line(err_xs, err_ys, line_color=plot_kwargs.get("color_dse", "grey"))
@@ -85,13 +86,14 @@ def plot_compare(
         ax.yaxis.ticker = yticks_pos[::2]
         ax.yaxis.major_label_overrides = dict(zip(yticks_pos[::2], yticks_labels))
-    elpd_circ = ax.circle(
+    elpd_circ = ax.scatter(
         comp_df[information_criterion],
         yticks_pos[::2],
         line_color=plot_kwargs.get("color_ic", "black"),
         fill_color=None,
         line_width=2,
         size=6,
+        marker="circle",
     )
     elpd_label = [elpd_circ]
@@ -110,7 +112,7 @@ def plot_compare(
     labels.append(("ELPD", elpd_label))
-    scale = comp_df["scale"][0]
+    scale = comp_df["scale"].iloc[0]
     if insample_dev:
         p_ic = comp_df[f"p_{information_criterion.split('_')[1]}"]
@@ -120,13 +122,14 @@ def plot_compare(
             correction = -p_ic
         elif scale == "deviance":
             correction = -(2 * p_ic)
-        insample_circ = ax.circle(
+        insample_circ = ax.scatter(
             comp_df[information_criterion] + correction,
             yticks_pos[::2],
             line_color=plot_kwargs.get("color_insample_dev", "black"),
             fill_color=plot_kwargs.get("color_insample_dev", "black"),
             line_width=2,
             size=6,
+            marker="circle",
         )
         labels.append(("In-sample ELPD", [insample_circ]))

arviz/plots/backends/bokeh/densityplot.py CHANGED Viewed

@@ -129,7 +129,6 @@ def _d_helper(
     shade,
     ax,
 ):
     extra = {}
     plotted = []

arviz/plots/backends/bokeh/distplot.py CHANGED Viewed

@@ -145,12 +145,10 @@ def _histplot_bokeh_op(values, values2, rotated, ax, hist_kwargs, is_circular):
         edges = edges.astype(float) - 0.5
     if is_circular:
         if is_circular == "degrees":
             edges = np.deg2rad(edges)
             labels = ["0°", "45°", "90°", "135°", "180°", "225°", "270°", "315°"]
         else:
             labels = [
                 r"0",
                 r"π/4",

arviz/plots/backends/bokeh/forestplot.py CHANGED Viewed

@@ -15,7 +15,6 @@ from ....rcparams import rcParams
 from ....stats import hdi
 from ....stats.density_utils import get_bins, histogram, kde
 from ....stats.diagnostics import _ess, _rhat
-from ....utils import conditional_jit
 from ...plot_utils import _scale_fig_size
 from .. import show_layout
 from . import backend_kwarg_defaults
@@ -277,7 +276,6 @@ class PlotHandler:
         """Collect labels and ticks from plotters."""
         val = self.plotters.values()
-        @conditional_jit(forceobj=True, nopython=False)
         def label_idxs():
             labels, idxs = [], []
             for plotter in val:
@@ -299,7 +297,7 @@ class PlotHandler:
     def legend(self, ax, plotted):
         """Add interactive legend with colorcoded model info."""
         legend_it = []
-        for (model_name, glyphs) in plotted.items():
+        for model_name, glyphs in plotted.items():
             legend_it.append((model_name, glyphs))
         legend = Legend(items=legend_it, orientation="vertical", location="top_left")
@@ -640,7 +638,7 @@ class VarHandler:
             grouped_data = [[(0, datum)] for datum in self.data]
             skip_dims = self.combine_dims.union({"chain"})
         else:
-            grouped_data = [datum.groupby("chain") for datum in self.data]
+            grouped_data = [datum.groupby("chain", squeeze=False) for datum in self.data]
             skip_dims = self.combine_dims
         label_dict = OrderedDict()
@@ -648,7 +646,7 @@ class VarHandler:
         for name, grouped_datum in zip(self.model_names, grouped_data):
             for _, sub_data in grouped_datum:
                 datum_iter = xarray_var_iter(
-                    sub_data,
+                    sub_data.squeeze(),
                     var_names=[self.var_name],
                     skip_dims=skip_dims,
                     reverse_selections=True,

arviz/plots/backends/bokeh/kdeplot.py CHANGED Viewed

@@ -165,7 +165,6 @@ def plot_kde(
         x_x, y_y = np.mgrid[xmin:xmax:g_s, ymin:ymax:g_s]
         if contour:
             scaled_density, *scaled_density_args = _scale_axis(density)
             contourpy_kwargs = _init_kwargs_dict(contour_kwargs.pop("contourpy_kwargs", {}))
@@ -224,7 +223,6 @@ def plot_kde(
             ax.ygrid.grid_line_color = None
         else:
             cmap = pcolormesh_kwargs.pop("cmap", "viridis")
             if isinstance(cmap, str):
                 cmap = get_cmap(cmap)

arviz/plots/backends/bokeh/pairplot.py CHANGED Viewed

@@ -241,11 +241,9 @@ def plot_pair(
     # pylint: disable=too-many-nested-blocks
     for i in range(0, numvars - marginals_offset):
         var1 = flat_var_names[i] if tmp_flat_var_names is None else tmp_flat_var_names[i]
         for j in range(0, numvars - marginals_offset):
             var2 = (
                 flat_var_names[j + marginals_offset]
                 if tmp_flat_var_names is None
@@ -268,7 +266,6 @@ def plot_pair(
                 ax[j, i].yaxis.axis_label = flat_var_names[j + marginals_offset]
             elif j + marginals_offset > i:
                 if "scatter" in kind:
                     if divergences:
                         ax[j, i].circle(var1, var2, source=source, view=source_nondiv)
@@ -328,7 +325,6 @@ def plot_pair(
                     ax[j, i].add_layout(ax_vline)
                     if marginals:
                         ax[j - 1, i].add_layout(ax_vline)
                         pe_last = calculate_point_estimate(point_estimate, plotters[-1][-1])

arviz/plots/backends/matplotlib/bfplot.py CHANGED Viewed

@@ -23,7 +23,6 @@ def plot_bf(
     backend_kwargs,
     show,
 ):
     """Matplotlib Bayes Factor plot."""
     if backend_kwargs is None:
         backend_kwargs = {}

arviz/plots/backends/matplotlib/bpvplot.py CHANGED Viewed

@@ -86,6 +86,9 @@ def plot_bpv(
         obs_vals = obs_vals.flatten()
         pp_vals = pp_vals.reshape(total_pp_samples, -1)
+        if obs_vals.dtype.kind == "i" or pp_vals.dtype.kind == "i":
+            obs_vals, pp_vals = smooth_data(obs_vals, pp_vals)
         if kind == "p_value":
             tstat_pit = np.mean(pp_vals <= obs_vals, axis=-1)
             x_s, tstat_pit_dens = kde(tstat_pit)
@@ -110,9 +113,6 @@ def plot_bpv(
                     ax_i.plot(x_ss, u_dens, linewidth=linewidth, **plot_ref_kwargs)
         elif kind == "u_value":
-            if obs_vals.dtype.kind == "i" or pp_vals.dtype.kind == "i":
-                obs_vals, pp_vals = smooth_data(obs_vals, pp_vals)
             tstat_pit = np.mean(pp_vals <= obs_vals, axis=0)
             x_s, tstat_pit_dens = kde(tstat_pit)
             ax_i.plot(x_s, tstat_pit_dens, color=color)

arviz/plots/backends/matplotlib/compareplot.py CHANGED Viewed

@@ -84,7 +84,7 @@ def plot_compare(
     else:
         ax.set_yticks(yticks_pos[::2])
-    scale = comp_df["scale"][0]
+    scale = comp_df["scale"].iloc[0]
     if insample_dev:
         p_ic = comp_df[f"p_{information_criterion.split('_')[1]}"]

arviz/plots/backends/matplotlib/dotplot.py CHANGED Viewed

@@ -97,7 +97,7 @@ def plot_dot(
     stack_locs, stack_count = wilkinson_algorithm(values, binwidth)
     x, y = layout_stacks(stack_locs, stack_count, binwidth, stackratio, rotated)
-    for (x_i, y_i) in zip(x, y):
+    for x_i, y_i in zip(x, y):
         dot = plt.Circle((x_i, y_i), dotsize * binwidth / 2, **plot_kwargs)
         ax.add_patch(dot)

arviz/plots/backends/matplotlib/forestplot.py CHANGED Viewed

@@ -11,7 +11,6 @@ from ....stats import hdi
 from ....stats.density_utils import get_bins, histogram, kde
 from ....stats.diagnostics import _ess, _rhat
 from ....sel_utils import xarray_var_iter
-from ....utils import conditional_jit
 from ...plot_utils import _scale_fig_size
 from . import backend_kwarg_defaults, backend_show
@@ -236,7 +235,6 @@ class PlotHandler:
         """Collect labels and ticks from plotters."""
         val = self.plotters.values()
-        @conditional_jit(forceobj=True, nopython=False)
         def label_idxs():
             labels, idxs = [], []
             for plotter in val:
@@ -536,7 +534,7 @@ class VarHandler:
             grouped_data = [[(0, datum)] for datum in self.data]
             skip_dims = self.combine_dims.union({"chain"})
         else:
-            grouped_data = [datum.groupby("chain") for datum in self.data]
+            grouped_data = [datum.groupby("chain", squeeze=False) for datum in self.data]
             skip_dims = self.combine_dims
         label_dict = OrderedDict()
@@ -544,7 +542,7 @@ class VarHandler:
         for name, grouped_datum in zip(self.model_names, grouped_data):
             for _, sub_data in grouped_datum:
                 datum_iter = xarray_var_iter(
-                    sub_data,
+                    sub_data.squeeze(),
                     var_names=[self.var_name],
                     skip_dims=skip_dims,
                     reverse_selections=True,

arviz/plots/backends/matplotlib/kdeplot.py CHANGED Viewed

@@ -88,7 +88,6 @@ def plot_kde(
         rug_space = max(density) * rug_kwargs.pop("space")
         if is_circular:
             if is_circular == "radians":
                 labels = [
                     "0",

arviz/plots/backends/matplotlib/khatplot.py CHANGED Viewed

@@ -201,7 +201,6 @@ def _make_hover_annotation(fig, ax, sc_plot, coord_labels, rgba_c, hover_format)
     offset = 10
     def update_annot(ind):
         idx = ind["ind"][0]
         pos = sc_plot.get_offsets()[idx]
         annot_text = hover_format.format(idx, coord_labels[idx])

arviz/plots/backends/matplotlib/lmplot.py CHANGED Viewed

@@ -50,7 +50,6 @@ def plot_lm(
         _, axes = create_axes_grid(length_plotters, rows, cols, backend_kwargs=backend_kwargs)
     for i, ax_i in enumerate(np.ravel(axes)[:length_plotters]):
         # All the kwargs are defined here beforehand
         y_kwargs = matplotlib_kwarg_dealiaser(y_kwargs, "plot")
         y_kwargs.setdefault("color", "C3")
@@ -68,22 +67,22 @@ def plot_lm(
         y_hat_plot_kwargs.setdefault("linewidth", 0)
         y_hat_fill_kwargs = matplotlib_kwarg_dealiaser(y_hat_fill_kwargs, "fill_between")
-        y_hat_fill_kwargs.setdefault("color", "C1")
+        y_hat_fill_kwargs.setdefault("color", "C3")
         y_model_plot_kwargs = matplotlib_kwarg_dealiaser(y_model_plot_kwargs, "plot")
-        y_model_plot_kwargs.setdefault("color", "k")
+        y_model_plot_kwargs.setdefault("color", "C6")
         y_model_plot_kwargs.setdefault("alpha", 0.5)
         y_model_plot_kwargs.setdefault("linewidth", 0.5)
         y_model_plot_kwargs.setdefault("zorder", 9)
         y_model_fill_kwargs = matplotlib_kwarg_dealiaser(y_model_fill_kwargs, "fill_between")
-        y_model_fill_kwargs.setdefault("color", "k")
+        y_model_fill_kwargs.setdefault("color", "C0")
         y_model_fill_kwargs.setdefault("linewidth", 0.5)
         y_model_fill_kwargs.setdefault("zorder", 9)
         y_model_fill_kwargs.setdefault("alpha", 0.5)
         y_model_mean_kwargs = matplotlib_kwarg_dealiaser(y_model_mean_kwargs, "plot")
-        y_model_mean_kwargs.setdefault("color", "y")
+        y_model_mean_kwargs.setdefault("color", "C6")
         y_model_mean_kwargs.setdefault("linewidth", 0.8)
         y_model_mean_kwargs.setdefault("zorder", 11)

arviz/plots/backends/matplotlib/pairplot.py CHANGED Viewed

@@ -291,7 +291,6 @@ def plot_pair(
                         ax[j, i].scatter(var1, var2, **scatter_kwargs)
                     if "kde" in kind:
                         plot_kde(
                             var1,
                             var2,

arviz/plots/backends/matplotlib/ppcplot.py CHANGED Viewed

@@ -371,8 +371,6 @@ def plot_ppc(
         if legend:
             if i == 0:
                 ax_i.legend(fontsize=xt_labelsize * 0.75)
-            else:
-                ax_i.legend([])
     if backend_show(show):
         plt.show()
@@ -414,15 +412,20 @@ def _set_animation(
         else:
             vals = pp_sampled_vals[0]
-            _, y_vals, x_vals = histogram(vals, bins="auto")
+            bins = get_bins(vals)
+            _, y_vals, x_vals = histogram(vals, bins=bins)
             (line,) = ax.plot(x_vals[:-1], y_vals, **plot_kwargs)
-            max_max = max(max(histogram(pp_sampled_vals[i], bins="auto")[1]) for i in range(length))
+            max_max = max(
+                max(histogram(pp_sampled_vals[i], bins=get_bins(pp_sampled_vals[i]))[1])
+                for i in range(length)
+            )
             ax.set_ylim(0, max_max)
             def animate(i):
-                _, y_vals, x_vals = histogram(pp_sampled_vals[i], bins="auto")
+                pp_vals = pp_sampled_vals[i]
+                _, y_vals, x_vals = histogram(pp_vals, bins=get_bins(pp_vals))
                 line.set_data(x_vals[:-1], y_vals)
                 return (line,)

arviz/plots/backends/matplotlib/traceplot.py CHANGED Viewed

@@ -430,7 +430,7 @@ def plot_trace(
             Line2D(
                 [], [], label=chain_id, **dealiase_sel_kwargs(legend_kwargs, chain_prop, chain_id)
             )
-            for chain_id in range(data.dims["chain"])
+            for chain_id in range(data.sizes["chain"])
         ]
         if combined:
             handles.insert(
@@ -470,7 +470,6 @@ def _plot_chains_mpl(
     circ_var_units,
     circ_units_trace,
 ):
     if not circular:
         circ_var_units = False

arviz/plots/bfplot.py CHANGED Viewed

@@ -38,7 +38,7 @@ def plot_bf(
     algorithm presented in [1]_.
     Parameters
-    -----------
+    ----------
     idata : InferenceData
         Any object that can be converted to an :class:`arviz.InferenceData` object
         Refer to documentation of :func:`arviz.convert_to_dataset` for details.
@@ -52,16 +52,16 @@ def plot_bf(
         Tuple of valid Matplotlib colors. First element for the prior, second for the posterior.
     figsize : (float, float), optional
         Figure size. If `None` it will be defined automatically.
-    textsize: float, optional
+    textsize : float, optional
         Text size scaling factor for labels, titles and lines. If `None` it will be auto
         scaled based on `figsize`.
-    plot_kwargs : dicts, optional
+    plot_kwargs : dict, optional
         Additional keywords passed to :func:`matplotlib.pyplot.plot`.
-    hist_kwargs : dicts, optional
+    hist_kwargs : dict, optional
         Additional keywords passed to :func:`arviz.plot_dist`. Only works for discrete variables.
     ax : axes, optional
         :class:`matplotlib.axes.Axes` or :class:`bokeh.plotting.Figure`.
-    backend :{"matplotlib", "bokeh"}, default "matplotlib"
+    backend : {"matplotlib", "bokeh"}, default "matplotlib"
         Select plotting backend.
     backend_kwargs : dict, optional
         These are kwargs specific to the backend being used, passed to
@@ -78,7 +78,7 @@ def plot_bf(
     References
     ----------
     .. [1] Heck, D., 2019. A caveat on the Savage-Dickey density ratio:
-    The case of computing Bayes factors for regression parameters.
+       The case of computing Bayes factors for regression parameters.
     Examples
     --------
@@ -92,6 +92,7 @@ def plot_bf(
         >>> idata = az.from_dict(posterior={"a":np.random.normal(1, 0.5, 5000)},
         ...     prior={"a":np.random.normal(0, 1, 5000)})
         >>> az.plot_bf(idata, var_name="a", ref_val=0)
     """
     posterior = extract(idata, var_names=var_name).values

arviz/plots/bpvplot.py CHANGED Viewed

@@ -162,6 +162,11 @@ def plot_bpv(
     ----------
     * Gelman et al. (2013) see http://www.stat.columbia.edu/~gelman/book/ pages 151-153 for details
+    Notes
+    -----
+    Discrete data is smoothed before computing either p-values or u-values using the
+    function :func:`~arviz.smooth_data`
     Examples
     --------
     Plot Bayesian p_values.
@@ -225,11 +230,11 @@ def plot_bpv(
     if flatten_pp is None:
         if flatten is None:
-            flatten_pp = list(predictive_dataset.dims.keys())
+            flatten_pp = list(predictive_dataset.dims)
         else:
             flatten_pp = flatten
     if flatten is None:
-        flatten = list(observed.dims.keys())
+        flatten = list(observed.dims)
     if coords is None:
         coords = {}

arviz/plots/compareplot.py CHANGED Viewed

@@ -90,10 +90,10 @@ def plot_compare(
     References
     ----------
     .. [1] Vehtari et al. (2016). Practical Bayesian model evaluation using leave-one-out
-    cross-validation and WAIC https://arxiv.org/abs/1507.04544
+       cross-validation and WAIC https://arxiv.org/abs/1507.04544
     .. [2] McElreath R. (2022). Statistical Rethinking A Bayesian Course with Examples in
-    R and Stan, Second edition, CRC Press.
+       R and Stan, Second edition, CRC Press.
     Examples
     --------

arviz/plots/ecdfplot.py CHANGED Viewed

@@ -1,8 +1,9 @@
 """Plot ecdf or ecdf-difference plot with confidence bands."""
 import numpy as np
-from scipy.stats import uniform, binom
+from scipy.stats import uniform
 from ..rcparams import rcParams
+from ..stats.ecdf_utils import compute_ecdf, ecdf_confidence_band, _get_ecdf_points
 from .plot_utils import get_plotting_function
@@ -26,7 +27,7 @@ def plot_ecdf(
     show=None,
     backend=None,
     backend_kwargs=None,
-    **kwargs
+    **kwargs,
 ):
     r"""Plot ECDF or ECDF-Difference Plot with Confidence bands.
@@ -48,6 +49,7 @@ def plot_ecdf(
         Values to compare to the original sample.
     cdf : callable, optional
         Cumulative distribution function of the distribution to compare the original sample.
+        The function must take as input a numpy array of draws from the distribution.
     difference : bool, default False
         If True then plot ECDF-difference plot otherwise ECDF plot.
     pit : bool, default False
@@ -180,75 +182,47 @@ def plot_ecdf(
     values = np.ravel(values)
     values.sort()
-    ## This block computes gamma and uses it to get the upper and lower confidence bands
-    ## Here we check if we want confidence bands or not
-    if confidence_bands:
-        ## If plotting PIT then we find the PIT values of sample.
-        ## Basically here we generate the evaluation points(x) and find the PIT values.
-        ## z is the evaluation point for our uniform distribution in compute_gamma()
-        if pit:
-            x = np.linspace(1 / npoints, 1, npoints)
-            z = x
-            ## Finding PIT for our sample
-            probs = cdf(values) if cdf else compute_ecdf(values2, values) / len(values2)
-        else:
-            ## If not PIT use sample for plots and for evaluation points(x) use equally spaced
-            ## points between minimum and maximum of sample
-            ## For z we have used cdf(x)
-            x = np.linspace(values[0], values[-1], npoints)
-            z = cdf(x) if cdf else compute_ecdf(values2, x)
-            probs = values
-        n = len(values)  # number of samples
-        ## Computing gamma
-        gamma = fpr if pointwise else compute_gamma(n, z, npoints, num_trials, fpr)
-        ## Using gamma to get the confidence intervals
-        lower, higher = get_lims(gamma, n, z)
-        ## This block is for whether to plot ECDF or ECDF-difference
-        if not difference:
-            ## We store the coordinates of our ecdf in x_coord, y_coord
-            x_coord, y_coord = get_ecdf_points(x, probs, difference)
+    if pit:
+        eval_points = np.linspace(1 / npoints, 1, npoints)
+        if cdf:
+            sample = cdf(values)
         else:
-            ## Here we subtract the ecdf value as here we are plotting the ECDF-difference
-            x_coord, y_coord = get_ecdf_points(x, probs, difference)
-            for i, x_i in enumerate(x):
-                y_coord[i] = y_coord[i] - (
-                    x_i if pit else cdf(x_i) if cdf else compute_ecdf(values2, x_i)
-                )
-            ## Similarly we subtract from the upper and lower bounds
-            if pit:
-                lower = lower - x
-                higher = higher - x
-            else:
-                lower = lower - (cdf(x) if cdf else compute_ecdf(values2, x))
-                higher = higher - (cdf(x) if cdf else compute_ecdf(values2, x))
+            sample = compute_ecdf(values2, values) / len(values2)
+        cdf_at_eval_points = eval_points
+        rvs = uniform(0, 1).rvs
     else:
-        if pit:
-            x = np.linspace(1 / npoints, 1, npoints)
-            probs = cdf(values)
+        eval_points = np.linspace(values[0], values[-1], npoints)
+        sample = values
+        if confidence_bands or difference:
+            if cdf:
+                cdf_at_eval_points = cdf(eval_points)
+            else:
+                cdf_at_eval_points = compute_ecdf(values2, eval_points)
         else:
-            x = np.linspace(values[0], values[-1], npoints)
-            probs = values
+            cdf_at_eval_points = np.zeros_like(eval_points)
+        rvs = None
+    x_coord, y_coord = _get_ecdf_points(sample, eval_points, difference)
+    if difference:
+        y_coord -= cdf_at_eval_points
+    if confidence_bands:
+        ndraws = len(values)
+        band_kwargs = {"prob": 1 - fpr, "num_trials": num_trials, "rvs": rvs, "random_state": None}
+        band_kwargs["method"] = "pointwise" if pointwise else "simulated"
+        lower, higher = ecdf_confidence_band(ndraws, eval_points, cdf_at_eval_points, **band_kwargs)
+        if difference:
+            lower -= cdf_at_eval_points
+            higher -= cdf_at_eval_points
+    else:
         lower, higher = None, None
-        ## This block is for whether to plot ECDF or ECDF-difference
-        if not difference:
-            x_coord, y_coord = get_ecdf_points(x, probs, difference)
-        else:
-            ## Here we subtract the ecdf value as here we are plotting the ECDF-difference
-            x_coord, y_coord = get_ecdf_points(x, probs, difference)
-            for i, x_i in enumerate(x):
-                y_coord[i] = y_coord[i] - (
-                    x_i if pit else cdf(x_i) if cdf else compute_ecdf(values2, x_i)
-                )
     ecdf_plot_args = dict(
         x_coord=x_coord,
         y_coord=y_coord,
-        x_bands=x,
+        x_bands=eval_points,
         lower=lower,
         higher=higher,
         confidence_bands=confidence_bands,
@@ -260,7 +234,7 @@ def plot_ecdf(
         ax=ax,
         show=show,
         backend_kwargs=backend_kwargs,
-        **kwargs
+        **kwargs,
     )
     if backend is None:
@@ -271,52 +245,3 @@ def plot_ecdf(
     ax = plot(**ecdf_plot_args)
     return ax
-def compute_ecdf(sample, z):
-    """Compute ECDF.
-    This function computes the ecdf value at the evaluation point
-        or a sorted set of evaluation points.
-    """
-    return np.searchsorted(sample, z, side="right") / len(sample)
-def get_ecdf_points(x, probs, difference):
-    """Compute the coordinates for the ecdf points using compute_ecdf."""
-    y = compute_ecdf(probs, x)
-    if not difference:
-        x = np.insert(x, 0, x[0])
-        y = np.insert(y, 0, 0)
-    return x, y
-def compute_gamma(n, z, npoints=None, num_trials=1000, fpr=0.05):
-    """Compute gamma for confidence interval calculation.
-    This function simulates an adjusted value of gamma to account for multiplicity
-    when forming an 1-fpr level confidence envelope for the ECDF of a sample.
-    """
-    if npoints is None:
-        npoints = n
-    gamma = []
-    for _ in range(num_trials):
-        unif_samples = uniform.rvs(0, 1, n)
-        unif_samples = np.sort(unif_samples)
-        gamma_m = 1000
-        ## Can compute ecdf for all the z together or one at a time.
-        f_z = compute_ecdf(unif_samples, z)
-        f_z = compute_ecdf(unif_samples, z)
-        gamma_m = 2 * min(
-            np.amin(binom.cdf(n * f_z, n, z)), np.amin(1 - binom.cdf(n * f_z - 1, n, z))
-        )
-        gamma.append(gamma_m)
-    return np.quantile(gamma, fpr)
-def get_lims(gamma, n, z):
-    """Compute the simultaneous 1 - fpr level confidence bands."""
-    lower = binom.ppf(gamma / 2, n, z)
-    upper = binom.ppf(1 - gamma / 2, n, z)
-    return lower / n, upper / n

arviz/plots/elpdplot.py CHANGED Viewed

@@ -98,7 +98,7 @@ def plot_elpd(
     References
     ----------
     .. [1] Vehtari et al. (2016). Practical Bayesian model evaluation using leave-one-out
-    cross-validation and WAIC https://arxiv.org/abs/1507.04544
+       cross-validation and WAIC https://arxiv.org/abs/1507.04544
     Examples
     --------

arviz/plots/essplot.py CHANGED Viewed

@@ -202,8 +202,8 @@ def plot_ess(
     data = get_coords(convert_to_dataset(idata, group="posterior"), coords)
     var_names = _var_names(var_names, data, filter_vars)
-    n_draws = data.dims["draw"]
-    n_samples = n_draws * data.dims["chain"]
+    n_draws = data.sizes["draw"]
+    n_samples = n_draws * data.sizes["chain"]
     ess_tail_dataset = None
     mean_ess = None

arviz 0.16.1__py3-none-any.whl → 0.17.1__py3-none-any.whl

arviz 0.16.1__py3-none-any.whl → 0.17.1__py3-none-any.whl