Documentation changes (#1338)
* modified wrapper to include custom things

* added examples for extended custom methods

* type error correction

* corrected minor nits

* documentation changes

* lint

* add changes to changelog

Co-authored-by: Oriol (ZBook) <[email protected]>
percygautam and OriolAbril authored Jan 16, 2021
1 parent 25ce6c4 commit ce68d3c
Showing 3 changed files with 243 additions and 20 deletions.
3 changes: 3 additions & 0 deletions CHANGELOG.md
@@ -32,6 +32,8 @@
* Switch to `compact=True` by default in our plots ([1468](https://github.com/arviz-devs/arviz/issues/1468))
* `plot_elpd`, avoid modifying the input dict ([1477](https://github.com/arviz-devs/arviz/issues/1477))
* Do not plot divergences in `plot_trace` when `kind=rank_vlines` or `kind=rank_bars` ([1476](https://github.com/arviz-devs/arviz/issues/1476))
* Allow ignoring `observed` argument of `pymc3.DensityDist` in `from_pymc3` ([1495](https://github.com/arviz-devs/arviz/pull/1495))
* Make `from_pymc3` compatible with theano-pymc 1.1.0 ([1495](https://github.com/arviz-devs/arviz/pull/1495))


### Deprecation
@@ -43,6 +45,7 @@
for markdown/notebook parsing in docs ([1406](https://github.com/arviz-devs/arviz/pull/1406))
* Incorporated `input_core_dims` in `hdi` and `plot_hdi` docstrings ([1410](https://github.com/arviz-devs/arviz/pull/1410))
* Add documentation pages about experimental `SamplingWrapper`s usage ([1373](https://github.com/arviz-devs/arviz/pull/1373))
* Extend API documentation about `InferenceData` methods ([1338](https://github.com/arviz-devs/arviz/pull/1338))

### Experimental
* Modified `SamplingWrapper` base API ([1373](https://github.com/arviz-devs/arviz/pull/1373))
38 changes: 30 additions & 8 deletions arviz/data/base.py
@@ -276,8 +276,23 @@ def make_attrs(attrs=None, library=None):
return default_attrs


def _extend_xr_method(func):
"""Make wrapper to extend methods from xr.Dataset to InferenceData Class."""
def _extend_xr_method(func, doc=None, description="", examples="", see_also=""):
"""Make wrapper to extend methods from xr.Dataset to InferenceData Class.

Parameters
----------
func : callable
An xr.Dataset method.
doc : str, optional
Complete docstring for the wrapped method; when given, it replaces the generated one.
description : str, optional
Description of ``func`` to be added to the generated docstring.
examples : str, optional
Examples of ``func`` to be added to the generated docstring.
see_also : str or list of str, optional
Related methods to be listed in the See Also section of the generated docstring.

"""
# pydocstyle requires a non empty line

@functools.wraps(func)
@@ -296,10 +311,11 @@ def wrapped(self, *args, **kwargs):

return None if _inplace else out

description = """
This method is extended from xarray.Dataset methods. For more info see :meth:`xarray:xarray.Dataset.{method_name}`
description_default = """{method_name} method is extended from xarray.Dataset methods.
{description}For more info see :meth:`xarray:xarray.Dataset.{method_name}`
""".format(
method_name=func.__name__ # pylint: disable=no-member
description=description, method_name=func.__name__ # pylint: disable=no-member
)
params = """
Parameters
@@ -316,14 +332,20 @@ def wrapped(self, *args, **kwargs):
If ``True``, modify the InferenceData object inplace,
otherwise, return the modified copy.
"""
see_also = """

if not isinstance(see_also, str):
see_also = "\n".join(see_also)
see_also_basic = """
See Also
--------
xarray.Dataset.{method_name}
{custom_see_also}
""".format(
method_name=func.__name__ # pylint: disable=no-member
method_name=func.__name__, custom_see_also=see_also # pylint: disable=no-member
)
wrapped.__doc__ = (
description_default + params + examples + see_also_basic if doc is None else doc
)
wrapped.__doc__ = description + params + see_also

return wrapped

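To make the wrapper's behaviour concrete, here is a minimal, self-contained sketch of the same pattern: an `xarray.Dataset` method is delegated to every group held by a container, and a docstring is assembled from the supplied pieces. The names `_delegate` and `_DemoData` are hypothetical illustrations, not part of the ArviZ code touched by this commit.

```python
import functools

import numpy as np
import xarray as xr


def _delegate(func, description="", see_also=""):
    """Simplified stand-in for _extend_xr_method (illustration only)."""

    @functools.wraps(func)
    def wrapped(self, *args, **kwargs):
        # Apply the xr.Dataset method to every group via an unbound call.
        for name, dataset in self._groups.items():
            self._groups[name] = func(dataset, *args, **kwargs)
        return self

    if not isinstance(see_also, str):
        see_also = "\n".join(see_also)
    # Compose the docstring from the pieces, mirroring the wrapper above.
    wrapped.__doc__ = (
        f"{func.__name__} method is extended from xarray.Dataset methods.\n"
        f"{description}\n\nSee Also\n--------\n"
        f"xarray.Dataset.{func.__name__}\n{see_also}\n"
    )
    return wrapped


class _DemoData:
    """Hypothetical container holding named xr.Dataset groups."""

    def __init__(self, **groups):
        self._groups = dict(groups)

    mean = _delegate(xr.Dataset.mean, see_also="median")
    median = _delegate(xr.Dataset.median, see_also="mean")


ds = xr.Dataset({"x": (("chain", "draw"), np.random.randn(2, 10))})
demo = _DemoData(posterior=ds)
demo.mean(dim="draw")  # reduces every group over the draw dimension
print(demo.mean.__doc__.splitlines()[0])
```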
222 changes: 210 additions & 12 deletions arviz/data/inference_data.py
@@ -560,6 +560,11 @@ def sel(
...: print(idata_subset.posterior_predictive.coords)
...: print(idata_subset.observed_data.coords)
See Also
--------
xarray.Dataset.sel : Returns a new dataset with each array indexed by tick labels along
the specified dimension(s).
isel : Returns a new dataset with each array indexed along the specified dimension(s).
"""
if chain_prior is not None:
warnings.warn(
@@ -622,6 +627,35 @@ def isel(
A new InferenceData object by default.
When `inplace==True` perform selection in-place and return `None`
Examples
--------
Use ``isel`` to discard one chain of the InferenceData object. We first check the
dimensions of the original object:
.. ipython::
In [1]: import arviz as az
...: idata = az.load_arviz_data("centered_eight")
...: del idata.prior # prior group only has 1 chain currently
...: print(idata.posterior.coords)
...: print(idata.posterior_predictive.coords)
...: print(idata.observed_data.coords)
In order to remove the third chain:
.. ipython::
In [1]: idata_subset = idata.isel(chain=[0, 1, 3])
...: print(idata_subset.posterior.coords)
...: print(idata_subset.posterior_predictive.coords)
...: print(idata_subset.observed_data.coords)
See Also
--------
xarray.Dataset.isel : Returns a new dataset with each array indexed along the specified
dimension(s).
sel : Returns a new dataset with each array indexed by tick labels along the specified
dimension(s).
"""
groups = self._group_names(groups, filter_groups)

@@ -677,6 +711,57 @@ def stack(
A new InferenceData object by default.
When `inplace==True` perform selection in-place and return `None`
Examples
--------
Use ``stack`` to stack any number of existing dimensions into a single new dimension.
We first check the original object:
.. ipython::
In [1]: import arviz as az
...: idata = az.load_arviz_data("rugby")
...: idata
In order to stack two dimensions ``chain`` and ``draw`` to ``sample``, we can use:
.. ipython::
In [1]: idata.stack(sample=["chain", "draw"], inplace=True)
...: idata
We can also create a custom InferenceData object and perform stacking on it. We first
check the original object:
.. ipython::
In [1]: import arviz as az
...: import numpy as np
...: datadict = {
...:     "a": np.random.randn(100),
...:     "b": np.random.randn(1, 100, 10),
...:     "c": np.random.randn(1, 100, 3, 4),
...: }
...: coords = {
...:     "c1": np.arange(3),
...:     "c99": np.arange(4),
...:     "b1": np.arange(10),
...: }
...: dims = {"c": ["c1", "c99"], "b": ["b1"]}
...: idata = az.from_dict(
...:     posterior=datadict, posterior_predictive=datadict, coords=coords, dims=dims
...: )
...: idata
In order to stack two dimensions ``c1`` and ``c99`` to ``z``, we can use:
.. ipython::
In [1]: idata.stack(z=["c1", "c99"], inplace=True)
...: idata
See Also
--------
xarray.Dataset.stack : Stack any number of existing dimensions into a single new dimension.
unstack : Perform an xarray unstacking on all groups of InferenceData object.
"""
groups = self._group_names(groups, filter_groups)

@@ -727,6 +812,43 @@ def unstack(self, dim=None, groups=None, filter_groups=None, inplace=False):
A new InferenceData object by default.
When `inplace==True` perform selection in place and return `None`
Examples
--------
Use ``unstack`` to unstack existing dimensions corresponding to MultiIndexes into
multiple new dimensions. We first stack two dimensions ``c1`` and ``c99`` to ``z``:
.. ipython::
In [1]: import arviz as az
...: import numpy as np
...: datadict = {
...:     "a": np.random.randn(100),
...:     "b": np.random.randn(1, 100, 10),
...:     "c": np.random.randn(1, 100, 3, 4),
...: }
...: coords = {
...:     "c1": np.arange(3),
...:     "c99": np.arange(4),
...:     "b1": np.arange(10),
...: }
...: dims = {"c": ["c1", "c99"], "b": ["b1"]}
...: dataset = az.from_dict(
...:     posterior=datadict, posterior_predictive=datadict, coords=coords, dims=dims
...: )
...: dataset.stack(z=["c1", "c99"], inplace=True)
...: dataset
In order to unstack the dimension ``z``, we use:
.. ipython::
In [1]: dataset.unstack(inplace=True)
...: dataset
See Also
--------
xarray.Dataset.unstack : Unstack existing dimensions corresponding to MultiIndexes into
multiple new dimensions.
stack : Perform an xarray stacking on all groups of InferenceData object.
"""
groups = self._group_names(groups, filter_groups)
if isinstance(dim, str):
@@ -769,13 +891,36 @@ def rename(self, name_dict=None, groups=None, filter_groups=None, inplace=False)
If ``True``, modify the InferenceData object inplace,
otherwise, return the modified copy.
Returns
-------
InferenceData
A new InferenceData object by default.
When `inplace==True` perform renaming in-place and return `None`
Examples
--------
Use ``rename`` to rename variables and dimensions on all groups of the InferenceData
object. We first check the original object:
.. ipython::
In [1]: import arviz as az
...: idata = az.load_arviz_data("rugby")
...: idata
In order to rename the dimensions and variable, we use:
.. ipython::
In [1]: idata.rename({"team": "team_new", "match": "match_new"}, inplace=True)
...: idata
See Also
--------
xarray.Dataset.rename : Returns a new object with renamed variables and dimensions.
rename_vars : Perform xarray renaming of variable or coordinate names on all groups of
an InferenceData object.
rename_dims : Perform xarray renaming of dimensions on all groups of InferenceData object.
"""
groups = self._group_names(groups, filter_groups)
if "chain" in name_dict.keys() or "draw" in name_dict.keys():
@@ -826,6 +971,33 @@ def rename_vars(self, name_dict=None, groups=None, filter_groups=None, inplace=F
A new InferenceData object with renamed variables including coordinates by default.
When `inplace==True` perform renaming in-place and return `None`
Examples
--------
Use ``rename_vars`` to rename variables and coordinates on all groups of the
InferenceData object. We first check the data variables of the original object:
.. ipython::
In [1]: import arviz as az
...: idata = az.load_arviz_data("rugby")
...: print(list(idata.posterior.data_vars))
...: print(list(idata.prior.data_vars))
In order to rename the data variables, we use:
.. ipython::
In [1]: idata.rename_vars({"home": "home_new"}, inplace=True)
...: print(list(idata.posterior.data_vars))
...: print(list(idata.prior.data_vars))
See Also
--------
xarray.Dataset.rename_vars : Returns a new object with renamed variables including
coordinates.
rename : Perform xarray renaming of variable and dimensions on all groups of
an InferenceData object.
rename_dims : Perform xarray renaming of dimensions on all groups of InferenceData object.
"""
groups = self._group_names(groups, filter_groups)

@@ -866,13 +1038,39 @@ def rename_dims(self, name_dict=None, groups=None, filter_groups=None, inplace=F
If ``True``, modify the InferenceData object inplace,
otherwise, return the modified copy.
Returns
-------
InferenceData
A new InferenceData object with renamed dimension by default.
When `inplace==True` perform renaming in-place and return `None`
Examples
--------
Use ``rename_dims`` to rename dimensions on all groups of the InferenceData
object. We first check the dimensions of the original object:
.. ipython::
In [1]: import arviz as az
...: idata = az.load_arviz_data("rugby")
...: print(list(idata.posterior.dims))
...: print(list(idata.prior.dims))
In order to rename the dimensions, we use:
.. ipython::
In [1]: idata.rename_dims({"team": "team_new"}, inplace=True)
...: print(list(idata.posterior.dims))
...: print(list(idata.prior.dims))
See Also
--------
xarray.Dataset.rename_dims : Returns a new object with renamed dimensions only.
rename : Perform xarray renaming of variable and dimensions on all groups of
an InferenceData object.
rename_vars : Perform xarray renaming of variable or coordinate names on all groups
of an InferenceData object.
"""
groups = self._group_names(groups, filter_groups)
if "chain" in name_dict.keys() or "draw" in name_dict.keys():
@@ -988,11 +1186,11 @@ def extend(self, other, join="left"):
else:
self._groups.append(group)

set_index = _extend_xr_method(xr.Dataset.set_index)
set_index = _extend_xr_method(xr.Dataset.set_index, see_also="reset_index")
get_index = _extend_xr_method(xr.Dataset.get_index)
reset_index = _extend_xr_method(xr.Dataset.reset_index)
set_coords = _extend_xr_method(xr.Dataset.set_coords)
reset_coords = _extend_xr_method(xr.Dataset.reset_coords)
reset_index = _extend_xr_method(xr.Dataset.reset_index, see_also="set_index")
set_coords = _extend_xr_method(xr.Dataset.set_coords, see_also="reset_coords")
reset_coords = _extend_xr_method(xr.Dataset.reset_coords, see_also="set_coords")
assign = _extend_xr_method(xr.Dataset.assign)
assign_coords = _extend_xr_method(xr.Dataset.assign_coords)
sortby = _extend_xr_method(xr.Dataset.sortby)
@@ -1002,12 +1200,12 @@ def extend(self, other, join="left"):
compute = _extend_xr_method(xr.Dataset.compute)
persist = _extend_xr_method(xr.Dataset.persist)

mean = _extend_xr_method(xr.Dataset.mean)
median = _extend_xr_method(xr.Dataset.median)
min = _extend_xr_method(xr.Dataset.min)
max = _extend_xr_method(xr.Dataset.max)
cumsum = _extend_xr_method(xr.Dataset.cumsum)
sum = _extend_xr_method(xr.Dataset.sum)
mean = _extend_xr_method(xr.Dataset.mean, see_also="median")
median = _extend_xr_method(xr.Dataset.median, see_also="mean")
min = _extend_xr_method(xr.Dataset.min, see_also=["max", "sum"])
max = _extend_xr_method(xr.Dataset.max, see_also=["min", "sum"])
cumsum = _extend_xr_method(xr.Dataset.cumsum, see_also="sum")
sum = _extend_xr_method(xr.Dataset.sum, see_also="cumsum")
quantile = _extend_xr_method(xr.Dataset.quantile)

def _group_names(self, groups, filter_groups=None):
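For reference, a quick usage sketch of the reduction methods extended above, run on the bundled `centered_eight` example data. It assumes the `groups` keyword handled by the wrapper (the group/filter handling lives in the collapsed part of this diff), so the reduction is applied to the posterior group only.

```python
import arviz as az

idata = az.load_arviz_data("centered_eight")

# Each extended method delegates to the matching xarray.Dataset method on the
# selected groups and returns a new InferenceData object (or None when inplace=True).
post_mean = idata.mean(dim="draw", groups="posterior")
print(post_mean.posterior)  # draw dimension reduced, chain kept

# Positional arguments are forwarded too, here the quantiles for xarray.Dataset.quantile.
post_q = idata.quantile([0.05, 0.95], dim="draw", groups="posterior")
print(post_q.posterior)
```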
