doc update

rabernat · rabernat · commit 80e4c8742db5 · 2016-05-16T16:37:49.000-04:00
diff --git a/doc/api.rst b/doc/api.rst
@@ -109,6 +109,7 @@ Computation
    Dataset.apply
    Dataset.reduce
    Dataset.groupby
+   Dataset.groupby_bins
    Dataset.resample
    Dataset.diff
 
@@ -245,6 +246,7 @@ Computation
 
    DataArray.reduce
    DataArray.groupby
+   DataArray.groupby_bins
    DataArray.rolling
    DataArray.resample
    DataArray.get_axis_num
diff --git a/doc/groupby.rst b/doc/groupby.rst
@@ -64,6 +64,33 @@ You can also iterate over over groups in ``(label, group)`` pairs:
 Just like in pandas, creating a GroupBy object is cheap: it does not actually
 split the data until you access particular values.
 
+Binning
+~~~~~~~
+
+Sometimes you don't want to use all the unique values to determine the groups
+but instead want to "bin" the data into coarser groups. You could always create
+a customized coordinate, but xarray facilitates this via the
+:py:meth:`~xarray.Dataset.groupby_bins` method.
+
+.. ipython:: python
+
+    x_bins = [0,25,50]
+    ds.groupby_bins('x', x_bins).groups
+
+The binning is implemented via `pandas.cut`__, whose documentation details how
+the bins are assigned. As seen in the example above, by default, the bins are
+labeled with strings using interval notation to precisely identify the bin
+limits. To override this behavior, you can specify the bin labels explicitly.
+Here we choose ``float`` labels which identify the bin centers:
+
+.. ipython:: python
+
+    x_bin_labels = [12.5,37.5]
+    ds.groupby_bins('x', x_bins, labels=x_bin_labels).groups
+
+__ https://pandas.pydata.org/docs/reference/api/pandas.cut.html
+
+
 Apply
 ~~~~~
 
@@ -170,3 +197,11 @@ __ http://cfconventions.org/cf-conventions/v1.6.0/cf-conventions.html#_two_dimen
     da
     da.groupby('lon').sum()
     da.groupby('lon').apply(lambda x: x - x.mean(), shortcut=False)
+
+Because multidimensional groups can generate a very large number of bins,
+coarse-binning via :py:meth:`~xarray.Dataset.groupby_bins` may be
+desirable:
+
+.. ipython:: python
+
+    da.groupby_bins('lon', [0,45,50]).sum()
diff --git a/xarray/core/common.py b/xarray/core/common.py
@@ -345,8 +345,9 @@ def groupby(self, group, squeeze=True):
 
     def groupby_bins(self, group, bins, right=True, labels=None, precision=3,
             include_lowest=False, squeeze=True):
-        """Returns a GroupBy object for performing grouped operations. Rather
-        than using all unique values of `group`, the values are discretized
+        """Returns a GroupBy object for performing grouped operations.
+
+        Rather than using all unique values of `group`, the values are discretized
         first by applying `pandas.cut` [1]_ to `group`.
 
         Parameters
@@ -361,7 +362,7 @@ def groupby_bins(self, group, bins, right=True, labels=None, precision=3,
             sequence it defines the bin edges allowing for non-uniform bin
             width. No extension of the range of x is done in this case.
         right : boolean, optional
-I           ndicates whether the bins include the rightmost edge or not. If
+            Indicates whether the bins include the rightmost edge or not. If
             right == True (the default), then the bins [1,2,3,4] indicate
             (1,2], (2,3], (3,4].
         labels : array or boolean, default None