pandas-dev · dsaxton · Feb 6, 2020 · Feb 6, 2020 · Feb 6, 2020 · Feb 6, 2020
diff --git a/doc/source/whatsnew/v1.0.2.rst b/doc/source/whatsnew/v1.0.2.rst
@@ -28,6 +28,11 @@ Fixed regressions
 Bug fixes
 ~~~~~~~~~
 
+**ExtensionArray**
+
+- Fixed issue where taking ``min`` or ``max`` of a ``StringArray`` or ``Series`` with ``StringDtype`` type would raise. (:issue:`31746`)
+-
+
 **Categorical**
 
 - Fixed bug where :meth:`Categorical.from_codes` improperly raised a ``ValueError`` when passed nullable integer codes. (:issue:`31779`)
@@ -37,7 +42,9 @@ Bug fixes
 - Using ``pd.NA`` with :meth:`DataFrame.to_json` now correctly outputs a null value instead of an empty object (:issue:`31615`)
 - Fixed bug in parquet roundtrip with nullable unsigned integer dtypes (:issue:`31896`).
 
+**Reduction**
 
+- Fixed bug where :meth:`Series.min` and :meth:`Series.max` would raise a ``TypeError`` in the presence of ``NaN`` for object dtype. (:issue:`18588`)
 
 **Experimental dtypes**
 
@@ -51,4 +58,4 @@ Bug fixes
 Contributors
 ~~~~~~~~~~~~
 
-.. contributors:: v1.0.1..v1.0.2|HEAD
+.. contributors:: v1.0.1..v1.0.2|HEAD
diff --git a/pandas/core/arrays/string_.py b/pandas/core/arrays/string_.py
@@ -4,6 +4,7 @@
 import numpy as np
 
 from pandas._libs import lib, missing as libmissing
+from pandas.compat.numpy import function as nv
 
 from pandas.core.dtypes.base import ExtensionDtype
 from pandas.core.dtypes.common import pandas_dtype
@@ -12,7 +13,7 @@
 from pandas.core.dtypes.inference import is_array_like
 
 from pandas import compat
-from pandas.core import ops
+from pandas.core import nanops, ops
 from pandas.core.arrays import PandasArray
 from pandas.core.construction import extract_array
 from pandas.core.indexers import check_array_indexer
@@ -274,8 +275,21 @@ def astype(self, dtype, copy=True):
  return super().astype(dtype, copy)
 
  def _reduce(self, name, skipna=True, **kwargs):
+ if name in ["min", "max"]:
+ return getattr(self, name)(skipna=skipna, **kwargs)
+
  raise TypeError(f"Cannot perform reduction '{name}' with string dtype")
 
+ def min(self, axis=None, out=None, keepdims=False, skipna=True):
+ nv.validate_min((), dict(out=out, keepdims=keepdims))
+ result = nanops.nanmin(self._ndarray, axis=axis, skipna=skipna, mask=isna(self))
+ return libmissing.NA if isna(result) else result
+
+ def max(self, axis=None, out=None, keepdims=False, skipna=True):
+ nv.validate_max((), dict(out=out, keepdims=keepdims))
+ result = nanops.nanmax(self._ndarray, axis=axis, skipna=skipna, mask=isna(self))
+ return libmissing.NA if isna(result) else result
+
  def value_counts(self, dropna=False):
  from pandas import value_counts
 

diff --git a/pandas/core/nanops.py b/pandas/core/nanops.py
@@ -228,7 +228,9 @@ def _maybe_get_mask(
  # Boolean data cannot contain nulls, so signal via mask being None
  return None
 
- if skipna:
+ if skipna or is_object_dtype(values.dtype):
+ # The masking in nanminmax does not work for object dtype, so always
+ # compute a mask for use later when skipna is False
  mask = isna(values)
 
  return mask
@@ -865,6 +867,17 @@ def reduction(
  result.fill(np.nan)
  except (AttributeError, TypeError, ValueError):
  result = np.nan
+ elif (
+ is_object_dtype(dtype)
+ and values.ndim == 1
+ and mask is not None
+ and mask.any()
+ ):
+ # Need to explicitly mask NA values for object dtypes
+ if skipna:
+ result = getattr(values[~mask], meth)(axis)
+ else:
+ result = np.nan
  else:
  result = getattr(values, meth)(axis)
 

diff --git a/pandas/tests/arrays/string_/test_string.py b/pandas/tests/arrays/string_/test_string.py
@@ -269,3 +269,31 @@ def test_value_counts_na():
  result = arr.value_counts(dropna=True)
  expected = pd.Series([2, 1], index=["a", "b"], dtype="Int64")
  tm.assert_series_equal(result, expected)
+
+
+@pytest.mark.parametrize("func", ["min", "max"])
+@pytest.mark.parametrize("skipna", [True, False])
+def test_reduction(func, skipna):
+ s = pd.Series(["x", "y", "z"], dtype="string")
+ result = getattr(s, func)(skipna=skipna)
+ expected = "x" if func == "min" else "z"
+
+ assert result == expected
+
+
+@pytest.mark.parametrize("func", ["min", "max"])
+@pytest.mark.parametrize("skipna", [True, False])
+@pytest.mark.parametrize("box_in_series", [True, False])
+def test_reduction_with_na(func, skipna, box_in_series):
+ data = pd.array([pd.NA, "y", "z"], dtype="string")
+
+ if box_in_series:
+ data = pd.Series(data)
+
+ result = getattr(data, func)(skipna=skipna)
+
+ if skipna:
+ expected = "y" if func == "min" else "z"
+ assert result == expected
+ else:
+ assert result is pd.NA
diff --git a/pandas/tests/extension/test_string.py b/pandas/tests/extension/test_string.py
@@ -77,7 +77,20 @@ class TestMissing(base.BaseMissingTests):
 
 
 class TestNoReduce(base.BaseNoReduceTests):
- pass
+ @pytest.mark.parametrize("skipna", [True, False])
+ def test_reduce_series_numeric(self, data, all_numeric_reductions, skipna):
+ if isinstance(data, pd.arrays.StringArray) and all_numeric_reductions in [
+ "min",
+ "max",
+ ]:
+ # Tested in pandas/tests/arrays/string_/test_string.py
+ pytest.skip("These reductions are implemented")
+
+ op_name = all_numeric_reductions
+ s = pd.Series(data)
+
+ with pytest.raises(TypeError):
+ getattr(s, op_name)(skipna=skipna)
 
 
 class TestMethods(base.BaseMethodsTests):

diff --git a/pandas/tests/frame/test_apply.py b/pandas/tests/frame/test_apply.py
@@ -1406,8 +1406,8 @@ def test_apply_datetime_tz_issue(self):
  @pytest.mark.parametrize("method", ["min", "max", "sum"])
  def test_consistency_of_aggregates_of_columns_with_missing_values(self, df, method):
  # GH 16832
- none_in_first_column_result = getattr(df[["A", "B"]], method)()
- none_in_second_column_result = getattr(df[["B", "A"]], method)()
+ none_in_first_column_result = getattr(df[["A", "B"]], method)().sort_index()
+ none_in_second_column_result = getattr(df[["B", "A"]], method)().sort_index()
 
  tm.assert_series_equal(
  none_in_first_column_result, none_in_second_column_result

diff --git a/pandas/tests/reductions/test_reductions.py b/pandas/tests/reductions/test_reductions.py
@@ -168,6 +168,19 @@ def test_numpy_reduction_with_tz_aware_dtype(self, tz_aware_fixture, func):
  result = getattr(np, func)(expected, expected)
  tm.assert_series_equal(result, expected)
 
+ @pytest.mark.parametrize("func", ["min", "max"])
+ @pytest.mark.parametrize("skipna", [True, False])
+ def test_reduce_object_with_na(self, func, skipna):
+ # https://github.com/pandas-dev/pandas/issues/18588
+ s = pd.Series(np.array(["a", "b", np.nan], dtype=object))
+ result = getattr(s, func)(skipna=skipna)
+
+ if skipna:
+ expected = "a" if func == "min" else "b"
+ assert result == expected
+ else:
+ assert result is np.nan
+
 
 class TestIndexReductions:
  # Note: the name TestIndexReductions indicates these tests