
Basic sorting support with Dask #256


Merged · 20 commits · May 8, 2025
Changes from 12 commits
72 changes: 61 additions & 11 deletions python/rapidsmpf/rapidsmpf/examples/dask.py
@@ -7,17 +7,20 @@
from typing import TYPE_CHECKING

import dask.dataframe as dd
import numpy as np
from dask.tokenize import tokenize
from dask.utils import M

import rmm.mr
from rmm.pylibrmm.stream import DEFAULT_STREAM

from rapidsmpf.integrations.dask.shuffler import rapidsmpf_shuffle_graph
from rapidsmpf.shuffler import partition_and_pack, unpack_and_concat
from rapidsmpf.shuffler import partition_and_pack, split_and_pack, unpack_and_concat
from rapidsmpf.testing import pylibcudf_to_cudf_dataframe

if TYPE_CHECKING:
from collections.abc import Sequence
from typing import Any

import dask_cudf

@@ -45,6 +48,8 @@ def insert_partition(
on: Sequence[str],
partition_count: int,
shuffler: Shuffler,
sort_boundaries: cudf.DataFrame | None,
options: dict[str, Any] | None,
) -> None:
"""
Add cudf DataFrame chunks to an RMPF shuffler.
@@ -59,22 +64,39 @@
Number of output partitions for the current shuffle.
shuffler
The RapidsMPF Shuffler object to extract from.
sort_boundaries
Output partition boundaries for sorting.
options
Optional key-work arguments.
Contributor:

Suggested change: "Optional key-work arguments." → "Optional key-word arguments."

Contributor:

And we use "Additional options." in a few places below. Let's pick one description and copy it through.

Member Author:

Ah yeah, missed this one - let's do the simple "Additional options." for now.

Contributor:

Would it make sense to make it DaskIntegration(on=, sort_boundaries=)? Or would that obfuscate/impede the way we build dask graphs here?

More of a question, as it would side-step the immediate need for breaking things (not that it matters) and might avoid the options catch-all.

Contributor:

I think it would be good to pass in the pid of df here for sorting. That is needed to find the right splits if you want to balance the result partition sizes in degenerate cases (such as all values being equal). And I believe we don't have another way to pass it in.

Member Author:

@seberg - I updated/generalized the protocol a bit. I didn't include the input partition id as a required argument, but we can add that now that we are changing things. Can you explain how having the input partition id would help you handle degenerate values?

Contributor @seberg (May 8, 2025):

Basically, the idea is that the split_boundary values know which partition ID they came from (and ideally their local row).

For example, we split (1, 1, 1, 1), distributed as pid0=(1, 1) and pid1=(1, 1). If you have the pid and row, then the split boundary will be (value, pid=1, row=0).

With that pid information, you can figure out here that pid=0 should send its data to 0 (split after the boundary) and pid=1 should send it all to 1 (split before the boundary here).

Without the additional information, there is no choice but for both pids to send all data to 0.

Member Author:

Okay, I see. This case definitely isn't a high priority yet (dask-dataframe still doesn't attempt to handle this at all), but it's a good-enough reason to include partition_id as a required argument to insert_partition now that we are updating the protocol anyway.
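A minimal sketch of the pid-tagged boundary idea from this thread; the tagging scheme and the function below are hypothetical, not part of this PR:

# Hypothetical sketch: boundaries tagged with their source partition id,
# so ties on the boundary value can be broken deterministically.
import numpy as np

def split_with_tagged_boundaries(
    values: np.ndarray,  # this input partition's sort column, already sorted
    pid: int,            # this input partition's id
    boundaries: list[tuple[float, int, int]],  # (value, src_pid, src_row)
) -> list[int]:
    splits = []
    for b_value, b_pid, _b_row in boundaries:
        # Rows from partitions before the boundary's source partition sort
        # to the left of it, so keep their ties on the left of the split.
        # (The row component would break ties within b_pid; ignored here.)
        side = "right" if pid < b_pid else "left"
        splits.append(int(np.searchsorted(values, b_value, side=side)))
    return splits

# The example above: pid0=(1, 1), pid1=(1, 1), boundary (value=1, pid=1, row=0).
assert split_with_tagged_boundaries(np.array([1, 1]), 0, [(1, 1, 0)]) == [2]  # all rows to output 0
assert split_with_tagged_boundaries(np.array([1, 1]), 1, [(1, 1, 0)]) == [0]  # all rows to output 1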

"""
columns_to_hash = tuple(list(df.columns).index(val) for val in on)
packed_inputs = partition_and_pack(
df.to_pylibcudf()[0],
columns_to_hash=columns_to_hash,
num_partitions=partition_count,
stream=DEFAULT_STREAM,
device_mr=rmm.mr.get_current_device_resource(),
)
if options:
raise ValueError(f"Unsupported options: {options}")
if sort_boundaries is None:
columns_to_hash = tuple(list(df.columns).index(val) for val in on)
packed_inputs = partition_and_pack(
df.to_pylibcudf()[0],
columns_to_hash=columns_to_hash,
num_partitions=partition_count,
stream=DEFAULT_STREAM,
device_mr=rmm.mr.get_current_device_resource(),
)
else:
df = df.sort_values(on)
splits = df[on[0]].searchsorted(sort_boundaries, side="right")
Contributor @seberg (May 8, 2025):

N.B. (I assume you are aware, and at most worth a code comment): good for an example, but it only works if the values in sort_boundaries are unique in df. Otherwise you need to adjust for where the boundary value came from - thus the longer function I shared.

EDIT: Sorry, this is not as bad as I first recalled, as it is only needed to avoid large imbalances in the result partition sizes.

packed_inputs = split_and_pack(
df.to_pylibcudf()[0],
splits.tolist(),
stream=DEFAULT_STREAM,
device_mr=rmm.mr.get_current_device_resource(),
)
shuffler.insert_chunks(packed_inputs)
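On the uniqueness caveat flagged above, a NumPy-only illustration (not part of the PR) of how duplicated boundary values skew the searchsorted splits:

# Illustrative only: quantile boundaries split unique data evenly, but
# heavily duplicated values push every row into the first output partition.
import numpy as np

unique_vals = np.array([1, 2, 3, 4, 5, 6, 7, 8])
print(np.searchsorted(unique_vals, [3, 6], side="right"))  # [3 6] -> balanced splits

equal_vals = np.ones(8, dtype=int)
print(np.searchsorted(equal_vals, [1, 1], side="right"))   # [8 8] -> everything lands in output 0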

@staticmethod
def extract_partition(
partition_id: int,
column_names: list[str],
shuffler: Shuffler,
options: dict[str, Any] | None,
) -> cudf.DataFrame:
"""
Extract a finished partition from the RMPF shuffler.
@@ -87,11 +109,15 @@
Sequence of output column names.
shuffler
The RapidsMPF Shuffler object to extract from.
options
Additional options.

Returns
-------
A shuffled DataFrame partition.
"""
if options:
raise ValueError(f"Unsupported options: {options}")
shuffler.wait_on(partition_id)
table = unpack_and_concat(
shuffler.extract(partition_id),
@@ -108,6 +134,7 @@ def dask_cudf_shuffle(
df: dask_cudf.DataFrame,
shuffle_on: list[str],
*,
sort: bool = False,
partition_count: int | None = None,
) -> dask_cudf.DataFrame:
"""
@@ -119,6 +146,10 @@
Input `dask_cudf.DataFrame` collection.
shuffle_on
List of column names to shuffle on.
sort
Whether the output partitioning should be in
sorted order. The first column in ``shuffle_on``
must be numerical.
partition_count
Output partition count. Default will preserve
the input partition count.
@@ -133,6 +164,13 @@
token = tokenize(df0, shuffle_on, count_out)
name_in = df0._name
name_out = f"shuffle-{token}"
if sort:
boundaries = (
df0[shuffle_on[0]].quantile(np.linspace(0.0, 1.0, count_out)[1:]).optimize()
)
sort_boundaries_name = (boundaries._name, 0)
else:
sort_boundaries_name = None
graph = rapidsmpf_shuffle_graph(
name_in,
name_out,
@@ -141,16 +179,28 @@
count_in,
count_out,
DaskCudfIntegration,
sort_boundaries_name=sort_boundaries_name,
)

# Add df0 dependencies to the task graph
graph.update(df0.dask)
if sort:
graph.update(boundaries.dask)

# Return a Dask-DataFrame collection
return dd.from_graph(
shuffled = dd.from_graph(
graph,
df0._meta,
(None,) * (count_out + 1),
[(name_out, pid) for pid in range(count_out)],
"rapidsmpf",
)

# Return a Dask-DataFrame collection
if sort:
return shuffled.map_partitions(
M.sort_values,
shuffle_on,
meta=shuffled._meta,
)
else:
return shuffled
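For orientation, a usage sketch of the new sort path; it assumes dask_cudf is installed and a RapidsMPF-enabled Dask cluster is already running (the column names are invented):

# Usage sketch; assumes dask_cudf plus a RapidsMPF-enabled Dask cluster.
import cudf
import dask_cudf
from rapidsmpf.examples.dask import dask_cudf_shuffle

ddf = dask_cudf.from_cudf(
    cudf.DataFrame({"a": [3, 1, 4, 1, 5], "b": range(5)}),
    npartitions=2,
)
# sort=True range-partitions on the quantiles of "a" and sorts each
# output partition, so the concatenated result is globally sorted on "a".
out = dask_cudf_shuffle(ddf, ["a"], sort=True, partition_count=2)
result = out.compute()
assert result["a"].is_monotonic_increasing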
58 changes: 55 additions & 3 deletions python/rapidsmpf/rapidsmpf/integrations/dask/shuffler.py
@@ -111,6 +111,8 @@ def insert_partition(
on: Sequence[str],
partition_count: int,
shuffler: Shuffler,
sort_boundaries: DataFrameT | None,
options: dict[str, Any] | None,
) -> None:
"""
Add a partition to a RapidsMPF Shuffler.
@@ -125,13 +127,19 @@
Number of output partitions for the current shuffle.
shuffler
The RapidsMPF Shuffler object to extract from.
sort_boundaries
Output partition boundaries for sorting. If None,
hashing will be used to calculate output partitions.
options
Additional options.
"""
Contributor:

I can imagine that we might eventually want more all-to-all-like patterns. Would it make more sense to change this interface such that insert_partition just takes the list[PackedData] and the shuffler, and we provide separate functions for hash- and sort-based partitioning (and the user can bring their own)?

So something like:

def insert_partition(
    shuffler: Shuffler,
    chunks: Sequence[PackedData], # Or whatever it is
) -> None:

And we provide two built-in functions:

def hash_partition(df, partition_count, *, on) -> list[PackedData]:
    ...
def sort_partition(df, partition_count, *, by) -> list[PackedData]:
    ...

Member Author:

I don't think that helps us generalize at all. We already have Shuffler.insert_chunks, which is essentially the insert_partition function you are proposing. The purpose of DaskIntegration.insert_partition is to avoid the need for various Dask shuffling applications to write their own task graph.

We want insert_partition/extract_partition to include the minimal necessary arguments to construct a "general" shuffling task graph. Since we are revising things, this may be:

    @staticmethod
    def insert_partition(
        df: DataFrameT,  # Partition to insert
        partition_count: int,   # Output partition count
        shuffler: Shuffler,   # Shuffler object
        options: dict[str, Any] | None,   # Arbitrary keyword arguments
        *other: Any,   # "Other" task-output data (e.g. sorting boundaries/quantiles)
    ) -> None:

    @staticmethod
    def extract_partition(
        partition_id: int,  # Partition ID to extract
        shuffler: Shuffler,   # Shuffler object
        options: dict[str, Any] | None,   # Arbitrary keyword arguments
    ) -> DataFrameT:

I think the options argument can be used to control most variations of a shuffle, and the *other positional argument could be used to pass in information that must be calculated dynamically at execution time.

Contributor:

Ah, ok, carry on then.


@staticmethod
def extract_partition(
partition_id: int,
column_names: list[str],
shuffler: Shuffler,
options: dict[str, Any] | None,
) -> DataFrameT:
"""
Extract a DataFrame partition from a RapidsMPF Shuffler.
@@ -144,6 +152,8 @@
Sequence of output column names.
shuffler
The RapidsMPF Shuffler object to extract from.
options
Additional options.

Returns
-------
@@ -214,11 +224,23 @@ def _stage_shuffler(


def _insert_partition(
callback: Callable[[DataFrameT, Sequence[str], int, Shuffler], None],
callback: Callable[
[
DataFrameT,
Sequence[str],
int,
Shuffler,
str | tuple[str, int] | None,
dict[str, Any],
],
None,
],
df: DataFrameT,
on: Sequence[str],
partition_count: int,
shuffle_id: int,
sort_boundaries_name: str | tuple[str, int] | None,
options: dict[str, Any],
) -> None:
"""
Add a partition to a RapidsMPF Shuffler.
@@ -237,6 +259,11 @@
Number of output partitions for the current shuffle.
shuffle_id
The RapidsMPF shuffle id.
sort_boundaries_name
The task name for sorting boundaries. Only needed
if the shuffle is in service of a sort operation.
options
Optional key-word arguments.
"""
if callback is None:
raise ValueError("callback missing in _insert_partition.")
@@ -247,15 +274,21 @@
on,
partition_count,
get_shuffler(shuffle_id),
sort_boundaries_name,
options,
)


def _extract_partition(
callback: Callable[[int, Sequence[str], Shuffler], DataFrameT],
callback: Callable[
[int, Sequence[str], Shuffler, dict[str, Any] | None],
DataFrameT,
],
shuffle_id: int,
partition_id: int,
column_names: list[str],
worker_barrier: tuple[int, ...],
options: dict[str, Any] | None,
) -> DataFrameT:
"""
Extract a partition from a RapidsMPF Shuffler.
@@ -275,6 +308,8 @@
worker_barrier
Worker-barrier task dependency. This value should
not be used for compute logic.
options
Additional options.

Returns
-------
@@ -286,6 +321,7 @@
partition_id,
column_names,
get_shuffler(shuffle_id),
options,
)


@@ -297,6 +333,9 @@
partition_count_in: int,
partition_count_out: int,
integration: DaskIntegration,
*,
sort_boundaries_name: str | tuple[str, int] | None = None,
options: dict[str, Any] | None = None,
) -> dict[Any, Any]:
"""
Return the task graph for a RapidsMPF shuffle.
@@ -310,13 +349,23 @@
column_names
Sequence of output column names.
shuffle_on
Sequence of column names to shuffle on (by hash).
Sequence of column names to shuffle on. Output
partitions will be based on the hash of these
columns, unless ``sort_boundaries_name`` is
specified. In the case of sorting, output
partitioning will be based on the first element
of ``shuffle_on`` only.
partition_count_in
Partition count of input collection.
partition_count_out
Partition count of output collection.
integration
Dask-integration specification.
sort_boundaries_name
The task name for sorting boundaries. Only needed
if the shuffle is in service of a sort operation.
options
Optional key-word arguments.

Returns
-------
@@ -422,6 +471,8 @@
shuffle_on,
partition_count_out,
shuffle_id,
sort_boundaries_name,
options,
)
for pid in range(partition_count_in)
}
@@ -463,6 +514,7 @@
part_id,
column_names,
(global_barrier_2_name, 0),
options,
)
# Assume round-robin partition assignment
restricted_keys[output_keys[-1]] = worker_ranks[rank]
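To see the revised protocol end to end, a schematic sketch of a custom integration; MyDataFrame, my_pack, and my_unpack are hypothetical placeholders, while insert_chunks, wait_on, and extract are the real Shuffler calls used in this PR:

# Schematic sketch of a custom DaskIntegration implementation.
# MyDataFrame, my_pack, and my_unpack are hypothetical placeholders.
from __future__ import annotations

from collections.abc import Sequence
from typing import Any

from rapidsmpf.shuffler import Shuffler


class MyIntegration:
    @staticmethod
    def insert_partition(
        df: MyDataFrame,
        on: Sequence[str],
        partition_count: int,
        shuffler: Shuffler,
        sort_boundaries: MyDataFrame | None,
        options: dict[str, Any] | None,
    ) -> None:
        # Hash-partition when sort_boundaries is None; range-partition otherwise.
        packed = my_pack(df, on, partition_count, sort_boundaries)
        shuffler.insert_chunks(packed)

    @staticmethod
    def extract_partition(
        partition_id: int,
        column_names: list[str],
        shuffler: Shuffler,
        options: dict[str, Any] | None,
    ) -> MyDataFrame:
        shuffler.wait_on(partition_id)  # block until the partition is ready
        return my_unpack(shuffler.extract(partition_id), column_names)

Such a class would then be passed as the integration argument to rapidsmpf_shuffle_graph, optionally together with sort_boundaries_name.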
17 changes: 13 additions & 4 deletions python/rapidsmpf/rapidsmpf/tests/test_dask.py
@@ -63,7 +63,12 @@ def get_rank(dask_worker: Worker) -> int:


@pytest.mark.parametrize("partition_count", [None, 3])
def test_dask_cudf_integration(loop: pytest.FixtureDef, partition_count: int) -> None: # noqa: F811
@pytest.mark.parametrize("sort", [True, False])
def test_dask_cudf_integration(
loop: pytest.FixtureDef, # noqa: F811
partition_count: int,
sort: bool, # noqa: FBT001
) -> None:
# Test basic Dask-cuDF integration
pytest.importorskip("dask_cudf")

@@ -83,14 +88,18 @@ def test_dask_cudf_integration(loop: pytest.FixtureDef, partition_count: int) ->
.to_backend("cudf")
)
partition_count_in = df.npartitions
expect = df.compute().sort_values(["x", "y"])
expect = df.compute().sort_values(["id", "name", "x", "y"])
shuffled = dask_cudf_shuffle(
df,
["name", "id"],
["id", "name"],
sort=sort,
partition_count=partition_count,
)
assert shuffled.npartitions == (partition_count or partition_count_in)
got = shuffled.compute().sort_values(["x", "y"])
got = shuffled.compute()
if sort:
assert got["id"].is_monotonic_increasing
got = got.sort_values(["id", "name", "x", "y"])

dd.assert_eq(expect, got, check_index=False)
