pandas-dev · rhshadrach · Jun 5, 2023 · May 25, 2023 · May 26, 2023 · May 26, 2023
diff --git a/doc/source/whatsnew/v2.1.0.rst b/doc/source/whatsnew/v2.1.0.rst
@@ -99,6 +99,7 @@ Other enhancements
 - :meth:`Categorical.from_codes` has gotten a ``validate`` parameter (:issue:`50975`)
 - :meth:`DataFrame.stack` gained the ``sort`` keyword to dictate whether the resulting :class:`MultiIndex` levels are sorted (:issue:`15105`)
 - Added ``engine_kwargs`` parameter to :meth:`DataFrame.to_excel` (:issue:`53220`)
+- Added a new parameter ``array_ops_only`` to :meth:`Series.apply`. When set to ``True`` the supplied callables will always operate on the whole Series (:issue:`53400`).
 - Performance improvement in :func:`concat` with homogeneous ``np.float64`` or ``np.float32`` dtypes (:issue:`52685`)
 - Performance improvement in :meth:`DataFrame.filter` when ``items`` is given (:issue:`52941`)
 -

diff --git a/pandas/core/apply.py b/pandas/core/apply.py
@@ -16,6 +16,7 @@
  Iterable,
  Iterator,
  List,
+ Literal,
  Sequence,
  cast,
 )
@@ -288,6 +289,11 @@ def agg_list_like(self) -> DataFrame | Series:
  -------
  Result of aggregation.
  """
+ return self.agg_or_apply_list_like(op_name="agg")
+
+ def agg_or_apply_list_like(
+ self, op_name: Literal["agg", "apply"]
+ ) -> DataFrame | Series:
  from pandas.core.groupby.generic import (
  DataFrameGroupBy,
  SeriesGroupBy,
@@ -296,6 +302,9 @@ def agg_list_like(self) -> DataFrame | Series:
 
  obj = self.obj
  func = cast(List[AggFuncTypeBase], self.func)
+ kwargs = self.kwargs
+ if op_name == "apply":
+ kwargs = {**kwargs, "by_row": False}
 
  if getattr(obj, "axis", 0) == 1:
  raise NotImplementedError("axis other than 0 is not supported")
@@ -313,8 +322,6 @@ def agg_list_like(self) -> DataFrame | Series:
  keys = []
 
  is_groupby = isinstance(obj, (DataFrameGroupBy, SeriesGroupBy))
- is_ser_or_df = isinstance(obj, (ABCDataFrame, ABCSeries))
- this_args = [self.axis, *self.args] if is_ser_or_df else self.args
 
  context_manager: ContextManager
  if is_groupby:
@@ -323,12 +330,19 @@ def agg_list_like(self) -> DataFrame | Series:
  context_manager = com.temp_setattr(obj, "as_index", True)
  else:
  context_manager = nullcontext()
+
+ def include_axis(colg) -> bool:
+ return isinstance(colg, ABCDataFrame) or (
+ isinstance(colg, ABCSeries) and op_name == "agg"
+ )
+
  with context_manager:
  # degenerate case
  if selected_obj.ndim == 1:
  for a in func:
  colg = obj._gotitem(selected_obj.name, ndim=1, subset=selected_obj)
- new_res = colg.aggregate(a, *this_args, **self.kwargs)
+ args = [self.axis, *self.args] if include_axis(colg) else self.args
+ new_res = getattr(colg, op_name)(a, *args, **kwargs)
  results.append(new_res)
 
  # make sure we find a good name
@@ -339,7 +353,8 @@ def agg_list_like(self) -> DataFrame | Series:
  indices = []
  for index, col in enumerate(selected_obj):
  colg = obj._gotitem(col, ndim=1, subset=selected_obj.iloc[:, index])
- new_res = colg.aggregate(func, *this_args, **self.kwargs)
+ args = [self.axis, *self.args] if include_axis(colg) else self.args
+ new_res = getattr(colg, op_name)(func, *args, **kwargs)
  results.append(new_res)
  indices.append(index)
  keys = selected_obj.columns.take(indices)
@@ -366,15 +381,21 @@ def agg_dict_like(self) -> DataFrame | Series:
  -------
  Result of aggregation.
  """
+ return self._apply_dict_like(op_name="agg")
+
+ def _apply_dict_like(self, op_name: Literal["agg", "apply"]) -> DataFrame | Series:
  from pandas import Index
  from pandas.core.groupby.generic import (
  DataFrameGroupBy,
  SeriesGroupBy,
  )
  from pandas.core.reshape.concat import concat
 
+ assert op_name in ["agg", "apply"]
+
  obj = self.obj
  func = cast(AggFuncTypeDict, self.func)
+ kwds = {"by_row": False} if op_name == "apply" else {}
 
  if getattr(obj, "axis", 0) == 1:
  raise NotImplementedError("axis other than 0 is not supported")
@@ -387,7 +408,7 @@ def agg_dict_like(self) -> DataFrame | Series:
  selected_obj = obj._selected_obj
  selection = obj._selection
 
- func = self.normalize_dictlike_arg("agg", selected_obj, func)
+ func = self.normalize_dictlike_arg(op_name, selected_obj, func)
 
  is_groupby = isinstance(obj, (DataFrameGroupBy, SeriesGroupBy))
  context_manager: ContextManager
@@ -407,7 +428,9 @@ def agg_dict_like(self) -> DataFrame | Series:
  if selected_obj.ndim == 1:
  # key only used for output
  colg = obj._gotitem(selection, ndim=1)
- result_data = [colg.agg(how) for _, how in func.items()]
+ result_data = [
+ getattr(colg, op_name)(how, **kwds) for _, how in func.items()
+ ]
  result_index = list(func.keys())
  elif is_non_unique_col:
  # key used for column selection and output
@@ -422,7 +445,7 @@ def agg_dict_like(self) -> DataFrame | Series:
  label_to_indices[label].append(index)
 
  key_data = [
- selected_obj._ixs(indice, axis=1).agg(how)
+ getattr(selected_obj._ixs(indice, axis=1), op_name)(how, **kwds)
  for label, indices in label_to_indices.items()
  for indice in indices
  ]
@@ -432,7 +455,8 @@ def agg_dict_like(self) -> DataFrame | Series:
  else:
  # key used for column selection and output
  result_data = [
- obj._gotitem(key, ndim=1).agg(how) for key, how in func.items()
+ getattr(obj._gotitem(key, ndim=1), op_name)(how)
+ for key, how in func.items()
  ]
  result_index = list(func.keys())
 
@@ -527,7 +551,7 @@ def apply_str(self) -> DataFrame | Series:
  self.kwargs["axis"] = self.axis
  return self._apply_str(obj, func, *self.args, **self.kwargs)
 
- def apply_multiple(self) -> DataFrame | Series:
+ def apply_list_or_dict_like(self) -> DataFrame | Series:
  """
  Compute apply in case of a list-like or dict-like.
 
@@ -543,9 +567,9 @@ def apply_multiple(self) -> DataFrame | Series:
  kwargs = self.kwargs
 
  if is_dict_like(func):
- result = self.agg_dict_like()
+ result = self._apply_dict_like(op_name="apply")
  else:
- result = self.agg_list_like()
+ result = self.agg_or_apply_list_like(op_name="apply")
 
  result = reconstruct_and_relabel_result(result, func, **kwargs)
 
@@ -685,8 +709,8 @@ def values(self):
  def apply(self) -> DataFrame | Series:
  """compute the results"""
  # dispatch to agg
- if is_list_like(self.func):
- return self.apply_multiple()
+ if is_list_like(self.func) or is_dict_like(self.func):
+ return self.apply_list_or_dict_like()
 
  # all empty
  if len(self.columns) == 0 and len(self.index) == 0:
@@ -1033,13 +1057,15 @@ def infer_to_same_shape(self, results: ResType, res_index: Index) -> DataFrame:
 class SeriesApply(NDFrameApply):
  obj: Series
  axis: AxisInt = 0
+ by_row: bool # only relevant for apply()
 
  def __init__(
  self,
  obj: Series,
  func: AggFuncType,
  *,
  convert_dtype: bool | lib.NoDefault = lib.no_default,
+ by_row: bool = True,
  args,
  kwargs,
  ) -> None:
@@ -1054,6 +1080,7 @@ def __init__(
  stacklevel=find_stack_level(),
  )
  self.convert_dtype = convert_dtype
+ self.by_row = by_row
 
  super().__init__(
  obj,
@@ -1071,8 +1098,8 @@ def apply(self) -> DataFrame | Series:
  return self.apply_empty_result()
 
  # dispatch to agg
- if is_list_like(self.func):
- return self.apply_multiple()
+ if is_list_like(self.func) or is_dict_like(self.func):
+ return self.apply_list_or_dict_like()
 
  if isinstance(self.func, str):
  # if we are a string, try to dispatch
@@ -1118,6 +1145,8 @@ def apply_standard(self) -> DataFrame | Series:
  if isinstance(func, np.ufunc):
  with np.errstate(all="ignore"):
  return func(obj, *self.args, **self.kwargs)
+ elif not self.by_row:
+ return func(obj, *self.args, **self.kwargs)
 
  if self.args or self.kwargs:
  # _map_values does not support args/kwargs

diff --git a/pandas/core/series.py b/pandas/core/series.py
@@ -4492,6 +4492,8 @@ def apply(
  func: AggFuncType,
  convert_dtype: bool | lib.NoDefault = lib.no_default,
  args: tuple[Any, ...] = (),
+ *,
+ by_row: bool = True,
  **kwargs,
  ) -> DataFrame | Series:
  """
@@ -4519,6 +4521,12 @@ def apply(
  instead if you want ``convert_dtype=False``.
  args : tuple
  Positional arguments passed to func after the series value.
+ by_row : bool, default True
+ If False, the func will be passed the whole Series at once.
+ If True, will func will be passed each element of the Series, like
+ Series.map (backward compatible).
+
+ .. versionadded:: 2.1.0
  **kwargs
  Additional keyword arguments passed to func.
 
@@ -4607,7 +4615,12 @@ def apply(
  dtype: float64
  """
  return SeriesApply(
- self, func, convert_dtype=convert_dtype, args=args, kwargs=kwargs
+ self,
+ func,
+ convert_dtype=convert_dtype,
+ by_row=by_row,
+ args=args,
+ kwargs=kwargs,
  ).apply()
 
  def _reindex_indexer(

diff --git a/pandas/tests/apply/test_series_apply.py b/pandas/tests/apply/test_series_apply.py
@@ -535,6 +535,20 @@ def test_apply_listlike_transformer(string_series, ops, names):
  tm.assert_frame_equal(result, expected)
 
 
+@pytest.mark.parametrize(
+ "ops, expected",
+ [
+ ([lambda x: x], DataFrame({"<lambda>": [1, 2, 3]})),
+ ([lambda x: x.sum()], Series([6], index=["<lambda>"])),
+ ],
+)
+def test_apply_listlike_lambda(ops, expected):
+ # GH53400
+ ser = Series([1, 2, 3])
+ result = ser.apply(ops)
+ tm.assert_equal(result, expected)
+
+
 @pytest.mark.parametrize(
  "ops",
  [