pandas-dev · jbrockmendel · Nov 25, 2018 · Nov 25, 2018 · Nov 25, 2018 · Nov 28, 2018
diff --git a/pandas/core/arrays/datetimelike.py b/pandas/core/arrays/datetimelike.py
@@ -12,6 +12,7 @@
 from pandas._libs.tslibs.timedeltas import Timedelta, delta_to_nanoseconds
 from pandas._libs.tslibs.timestamps import maybe_integer_op_deprecated
 import pandas.compat as compat
+from pandas.compat.numpy import function as nv
 from pandas.errors import (
     AbstractMethodError, NullFrequencyError, PerformanceWarning)
 from pandas.util._decorators import deprecate_kwarg
@@ -27,13 +28,55 @@
 
 from pandas.core.algorithms import checked_add_with_arr, take, unique1d
 import pandas.core.common as com
+from pandas.core.nanops import nanstd
 
 from pandas.tseries import frequencies
 from pandas.tseries.offsets import DateOffset, Tick
 
 from .base import ExtensionOpsMixin
 
 
+def _get_reduction_vals(obj, skipna):
+    """Return the ``asi8`` values of ``obj`` to reduce over, or NaT."""
+    # A NaT return (instead of an array) tells the caller the reduction is
+    #  NaT: ``obj`` is empty, or ``obj.hasnans`` and ``skipna`` is False.
+    if not len(obj):
+        return NaT
+    if not obj.hasnans:
+        return obj.asi8
+    if not skipna:
+        return NaT
+    return obj.asi8[~obj._isnan]
+
+
+def _make_reduction(op, diff=False, only_timedelta=False):
+    """
+    Make a unary reduction method that handles NaT appropriately.
+
+    ``op``'s result is boxed via ``self._box_func`` (as an offset from
+    ``self._box_func(0)`` if ``diff``); ``only_timedelta`` always raises.
+    """
+
+    def method(self, skipna=True, **kwargs):
+        if only_timedelta:
+            raise TypeError('"{meth}" reduction is not valid for {cls}'
+                            .format(meth=op.__name__, cls=type(self).__name__))
+        vals = _get_reduction_vals(self, skipna)
+        if vals is NaT:
+            return NaT
+        result = op(vals, **kwargs)
+        if not isinstance(result, (int, np.integer)):
+            # Round floats to minimize error in the int64 cast; integer
+            #  results (e.g. min/max) skip the lossy float64 round-trip.
+            result = np.float64(result).round()
+        boxed = self._box_func(np.int64(result))
+        return boxed - self._box_func(0) if diff else boxed
+
+    method.__name__ = op.__name__
+    # TODO: __doc__
+    return method
+
+
 def _make_comparison_op(cls, op):
     # TODO: share code with indexes.base version?  Main difference is that
     # the block for MultiIndex was removed here.
@@ -364,6 +407,19 @@ def _validate_frequency(cls, index, freq, **kwargs):
                              'does not conform to passed frequency {passed}'
                              .format(infer=inferred, passed=freq.freqstr))
 
+    # ----------------------------------------------------------------
+    # Reductions
+
+    min = _make_reduction(np.min)
+    max = _make_reduction(np.max)
+    # float results below are rounded before being cast back to int64
+    mean = _make_reduction(np.mean)
+    median = _make_reduction(np.median)
+    std = _make_reduction(nanstd, diff=True)
+    # NOTE(review): as written, ``sum`` raises TypeError for every class
+    sum = _make_reduction(np.sum, only_timedelta=True)
+    # TODO: cumsum (np.cumsum returns an array, so not a scalar reduction)
+
     # ------------------------------------------------------------------
     # Arithmetic Methods
 

diff --git a/pandas/core/base.py b/pandas/core/base.py
@@ -795,7 +795,7 @@ def _ndarray_values(self):
     def empty(self):
         return not self.size
 
-    def max(self):
+    def max(self, skipna=True, axis=None):
         """
         Return the maximum value of the Index.
 
@@ -826,19 +826,21 @@ def max(self):
         >>> idx.max()
         ('b', 2)
         """
+        nv.validate_minmax_axis(axis)
         return nanops.nanmax(self.values)
 
-    def argmax(self, axis=None):
+    def argmax(self, skipna=True, axis=None):
         """
         Return a ndarray of the maximum argument indexer.
 
         See Also
         --------
         numpy.ndarray.argmax
         """
+        nv.validate_minmax_axis(axis)
         return nanops.nanargmax(self.values)
 
-    def min(self):
+    def min(self, skipna=True, axis=None):
         """
         Return the minimum value of the Index.
 
@@ -869,16 +871,18 @@ def min(self):
         >>> idx.min()
         ('a', 1)
         """
+        nv.validate_minmax_axis(axis)
         return nanops.nanmin(self.values)
 
-    def argmin(self, axis=None):
+    def argmin(self, skipna=True, axis=None):
         """
         Return a ndarray of the minimum argument indexer.
 
         See Also
         --------
         numpy.ndarray.argmin
         """
+        nv.validate_minmax_axis(axis)
         return nanops.nanargmin(self.values)
 
     def tolist(self):

diff --git a/pandas/core/indexes/datetimelike.py b/pandas/core/indexes/datetimelike.py
@@ -442,7 +442,7 @@ def tolist(self):
         """
         return list(self.astype(object))
 
-    def min(self, axis=None, *args, **kwargs):
+    def min(self, skipna=True, axis=None, *args, **kwargs):
         """
         Return the minimum value of the Index or minimum along
         an axis.
@@ -470,7 +470,7 @@ def min(self, axis=None, *args, **kwargs):
         except ValueError:
             return self._na_value
 
-    def argmin(self, axis=None, *args, **kwargs):
+    def argmin(self, skipna=True, axis=None, *args, **kwargs):
         """
         Returns the indices of the minimum values along an axis.
 
@@ -493,7 +493,7 @@ def argmin(self, axis=None, *args, **kwargs):
             i8[mask] = np.iinfo('int64').max
         return i8.argmin()
 
-    def max(self, axis=None, *args, **kwargs):
+    def max(self, skipna=True, axis=None, *args, **kwargs):
         """
         Return the maximum value of the Index or maximum along
         an axis.
@@ -521,7 +521,7 @@ def max(self, axis=None, *args, **kwargs):
         except ValueError:
             return self._na_value
 
-    def argmax(self, axis=None, *args, **kwargs):
+    def argmax(self, skipna=True, axis=None, *args, **kwargs):
         """
         Returns the indices of the maximum values along an axis.
 

diff --git a/pandas/core/indexes/period.py b/pandas/core/indexes/period.py
@@ -14,7 +14,7 @@
 
 from pandas.core.dtypes.common import (
     is_bool_dtype, is_datetime64_any_dtype, is_float, is_float_dtype,
-    is_integer, is_integer_dtype, pandas_dtype)
+    is_integer, is_integer_dtype, is_scalar, pandas_dtype)
 
 from pandas import compat
 from pandas.core import common as com
@@ -72,6 +72,9 @@ def _delegate_property_set(self, name, value, *args, **kwargs):
 
     def _delegate_method(self, name, *args, **kwargs):
         result = operator.methodcaller(name, *args, **kwargs)(self._data)
+        if is_scalar(result):
+            # scalar (e.g. from min, max, mean): return as-is, not an Index
+            return result
         return Index(result, name=self.name)
 
 

diff --git a/pandas/core/indexes/range.py b/pandas/core/indexes/range.py
@@ -25,7 +25,6 @@
 
 
 class RangeIndex(Int64Index):
-
     """
     Immutable Index implementing a monotonic integer range.
 
@@ -288,11 +287,11 @@ def _minmax(self, meth):
 
         return self._start + self._step * no_steps
 
-    def min(self):
+    def min(self, skipna=True, axis=None):
         """The minimum value of the RangeIndex"""
         return self._minmax('min')
 
-    def max(self):
+    def max(self, skipna=True, axis=None):
         """The maximum value of the RangeIndex"""
         return self._minmax('max')
 

diff --git a/pandas/core/nanops.py b/pandas/core/nanops.py
@@ -12,8 +12,8 @@
 from pandas.core.dtypes.cast import _int64_max, maybe_upcast_putmask
 from pandas.core.dtypes.common import (
     _get_dtype, is_any_int_dtype, is_bool_dtype, is_complex, is_complex_dtype,
-    is_datetime64_dtype, is_datetime_or_timedelta_dtype, is_float,
-    is_float_dtype, is_integer, is_integer_dtype, is_numeric_dtype,
+    is_datetime64_dtype, is_datetime64tz_dtype, is_datetime_or_timedelta_dtype,
+    is_float, is_float_dtype, is_integer, is_integer_dtype, is_numeric_dtype,
     is_object_dtype, is_scalar, is_timedelta64_dtype)
 from pandas.core.dtypes.missing import isna, na_value_for_dtype, notna
 
@@ -426,7 +426,6 @@ def nansum(values, axis=None, skipna=True, min_count=0, mask=None):
     return _wrap_results(the_sum, dtype)
 
 
-@disallow('M8')
 @bottleneck_switch()
 def nanmean(values, axis=None, skipna=True, mask=None):
     """
@@ -462,6 +461,14 @@ def nanmean(values, axis=None, skipna=True, mask=None):
     elif is_float_dtype(dtype):
         dtype_sum = dtype
         dtype_count = dtype
+    elif is_datetime64_dtype(dtype) or is_datetime64tz_dtype(dtype):
+        from pandas import DatetimeIndex
+        masked_vals = values
+        if mask is not None:
+            masked_vals = values[~mask]
+        the_mean = DatetimeIndex(masked_vals).mean(skipna=skipna)
+        return the_mean
+
     count = _get_counts(mask, axis, dtype=dtype_count)
     the_sum = _ensure_numeric(values.sum(axis, dtype=dtype_sum))
 
@@ -476,7 +483,6 @@ def nanmean(values, axis=None, skipna=True, mask=None):
     return _wrap_results(the_mean, dtype)
 
 
-@disallow('M8')
 @bottleneck_switch()
 def nanmedian(values, axis=None, skipna=True, mask=None):
     """
@@ -508,6 +514,14 @@ def get_median(x):
         return np.nanmedian(x[mask])
 
     values, mask, dtype, dtype_max, _ = _get_values(values, skipna, mask=mask)
+
+    if is_datetime64_dtype(dtype) or is_datetime64tz_dtype(dtype):
+        from pandas import DatetimeIndex
+        masked_vals = values
+        if mask is not None:
+            masked_vals = values[~mask]
+        return DatetimeIndex(masked_vals).median(skipna=skipna)
+
     if not is_float_dtype(values):
         values = values.astype('f8')
         values[mask] = np.nan
@@ -561,7 +575,6 @@ def _get_counts_nanvar(mask, axis, ddof, dtype=float):
     return count, d
 
 
-@disallow('M8')
 @bottleneck_switch(ddof=1)
 def nanstd(values, axis=None, skipna=True, ddof=1, mask=None):
     """
@@ -591,6 +604,14 @@ def nanstd(values, axis=None, skipna=True, ddof=1, mask=None):
     >>> nanops.nanstd(s)
     1.0
     """
+    if is_datetime64_dtype(values) or is_datetime64tz_dtype(values):
+        from pandas import DatetimeIndex
+        masked_vals = values
+        if mask is not None:
+            masked_vals = values[~mask]
+        return DatetimeIndex(masked_vals).std(skipna=skipna)
+        # TODO: adjust by ddof?
+
     result = np.sqrt(nanvar(values, axis=axis, skipna=skipna, ddof=ddof,
                             mask=mask))
     return _wrap_results(result, values.dtype)

diff --git a/pandas/core/series.py b/pandas/core/series.py
@@ -29,7 +29,8 @@
     is_integer, is_integer_dtype, is_iterator, is_list_like, is_object_dtype,
     is_scalar, is_string_like, is_timedelta64_dtype, pandas_dtype)
 from pandas.core.dtypes.generic import (
-    ABCDataFrame, ABCIndexClass, ABCSeries, ABCSparseArray, ABCSparseSeries)
+    ABCDataFrame, ABCDatetimeIndex, ABCIndexClass, ABCSeries, ABCSparseArray,
+    ABCSparseSeries)
 from pandas.core.dtypes.missing import (
     isna, na_value_for_dtype, notna, remove_na_arraylike)
 
@@ -3454,6 +3455,16 @@ def _reduce(self, op, name, axis=0, skipna=True, numeric_only=None,
         # dispatch to ExtensionArray interface
         if isinstance(delegate, ExtensionArray):
             return delegate._reduce(name, skipna=skipna, **kwds)
+        if (isinstance(delegate, ABCDatetimeIndex) and
+                name in ['mean', 'median', 'std', 'min', 'max']):
+            if numeric_only or filter_type:
+                raise TypeError
+            method = getattr(delegate, name)
+            try:
+                return method(skipna=skipna, **kwds)
+            except TypeError:
+                # kludge because not all reduction implementations take skipna
+                return method(**kwds)
 
         # dispatch to numpy arrays
         elif isinstance(delegate, np.ndarray):

diff --git a/pandas/tests/indexes/datetimes/test_ops.py b/pandas/tests/indexes/datetimes/test_ops.py
@@ -47,6 +47,20 @@ def test_ops_properties_basic(self):
         assert s.day == 10
         pytest.raises(AttributeError, lambda: s.weekday)
 
+    def test_mean(self, tz_naive_fixture):
+        tz = tz_naive_fixture
+        idx1 = pd.DatetimeIndex(['2011-01-01', '2011-01-02',
+                                 '2011-01-03'], tz=tz)
+        assert idx1.mean() == pd.Timestamp('2011-01-02', tz=tz)
+        # NaT propagates only when skipna=False
+        idx2 = pd.DatetimeIndex(['2011-01-01', '2011-01-02', pd.NaT,
+                                 '2011-01-03'], tz=tz)
+        assert idx2.mean(skipna=False) is pd.NaT
+        assert idx2.mean(skipna=True) == pd.Timestamp('2011-01-02', tz=tz)
+        # an empty index has no mean, with or without a timezone
+        idx3 = pd.DatetimeIndex([], tz=tz)
+        assert idx3.mean() is pd.NaT
+
     def test_minmax_tz(self, tz_naive_fixture):
         tz = tz_naive_fixture
         # monotonic