rapidsai · rapids-bot · Apr 21, 2022 · Apr 19, 2022 · Apr 19, 2022 · Apr 20, 2022
@@ -516,7 +516,7 @@ def pipe(self, func, *args, **kwargs):
         """
         return cudf.core.common.pipe(self, func, *args, **kwargs)
 
-    def apply(self, function):
+    def apply(self, function, *args):
         """Apply a python transformation function over the grouped chunk.
 
         Parameters
@@ -594,17 +594,19 @@ def mult(df):
         chunks = [
             grouped_values[s:e] for s, e in zip(offsets[:-1], offsets[1:])
         ]
-        chunk_results = [function(chk) for chk in chunks]
-
+        chunk_results = [function(chk, *args) for chk in chunks]
         if not len(chunk_results):
             return self.obj.head(0)
 
         if cudf.api.types.is_scalar(chunk_results[0]):
             result = cudf.Series(chunk_results, index=group_names)
             result.index.names = self.grouping.names
         elif isinstance(chunk_results[0], cudf.Series):
-            result = cudf.concat(chunk_results, axis=1).T
-            result.index.names = self.grouping.names
+            if isinstance(self.obj, cudf.DataFrame):
+                result = cudf.concat(chunk_results, axis=1).T
+                result.index.names = self.grouping.names
+            else:
+                result = cudf.concat(chunk_results)
         else:
             result = cudf.concat(chunk_results)
 
@@ -1581,8 +1583,8 @@ def agg(self, func):
 
         return result
 
-    def apply(self, func):
-        result = super().apply(func)
+    def apply(self, func, *args):
+        result = super().apply(func, *args)
 
         # apply Series name to result
         result.name = self.obj.name

@@ -291,6 +291,14 @@ def foo(df):
     got = got_grpby.apply(foo)
     assert_groupby_results_equal(expect, got)
 
+    def foo_args(df, k):  # k: extra positional argument given to apply()
+        df["out"] = df["val1"] + df["val2"] + k  # sets column "out" in place
+        return df
+
+    expect = expect_grpby.apply(foo_args, 2)
+    got = got_grpby.apply(foo_args, 2)
+    assert_groupby_results_equal(expect, got)
+
 
 def test_groupby_apply_grouped():
     np.random.seed(0)
@@ -1626,6 +1634,17 @@ def custom_map_func(x):
 
     assert_groupby_results_equal(expected, actual)
 
+    def custom_map_func_args(x, k):  # k: extra positional arg via apply()
+        x = x[~x["B"].isna()]  # keep only rows where column "B" is not null
+        ticker = x.shape[0]  # number of remaining rows
+        full = ticker / 10 + k
+        return full + 1.8 / k
+
+    expected = pdf.groupby("A").apply(custom_map_func_args, 2)
+    actual = gdf.groupby("A").apply(custom_map_func_args, 2)
+
+    assert_groupby_results_equal(expected, actual)
+
 
 @pytest.mark.parametrize(
     "cust_func",
@@ -1643,6 +1662,21 @@ def test_groupby_apply_return_series_dataframe(cust_func):
     assert_groupby_results_equal(expected, actual)
 
 
+def test_groupby_apply_return_series_dataframe_args():
+    pdf = pd.DataFrame(
+        {"key": [0, 0, 1, 1, 2, 2, 2], "val": [0, 1, 2, 3, 4, 5, 6]}
+    )
+    gdf = cudf.from_pandas(pdf)  # cuDF copy of the same data
+
+    def cust_func(x, k):  # k: extra positional argument given to apply()
+        return x - x.min() + k
+
+    expected = pdf.groupby(["key"]).apply(cust_func, 2)
+    actual = gdf.groupby(["key"]).apply(cust_func, 2)  # same call on cuDF
+
+    assert_groupby_results_equal(expected, actual)
+
+
 @pytest.mark.parametrize(
     "pdf",
     [pd.DataFrame(), pd.DataFrame({"a": []}), pd.Series([], dtype="float64")],
@@ -2212,6 +2246,14 @@ def foo(x):
 
     assert_groupby_results_equal(expect, got)
 
+    def foo_args(x, k):  # k: extra positional argument given to apply()
+        return x.sum() + k
+
+    got = make_frame(DataFrame, 100).groupby("x").y.apply(foo_args, 2)
+    expect = make_frame(pd.DataFrame, 100).groupby("x").y.apply(foo_args, 2)
+
+    assert_groupby_results_equal(expect, got)
+
 
 @pytest.mark.parametrize("label", [None, "left", "right"])
 @pytest.mark.parametrize("closed", [None, "left", "right"])