rapidsai · rapids-bot · Jun 26, 2025 · Jun 18, 2025 · Jun 18, 2025 · Jun 25, 2025
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2019-2024, NVIDIA CORPORATION.
+ * Copyright (c) 2019-2025, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -48,10 +48,8 @@ enum class scan_type : bool { INCLUSIVE, EXCLUSIVE };
  *
  * Any null values are skipped for the operation.
  *
- * If the column is empty or contains all null entries `col.size()==col.null_count()`,
- * the output scalar value will be `false` for reduction type `any` and `true`
- * for reduction type `all`. For all other reductions, the output scalar
- * returns with `is_valid()==false`.
+ * For empty or all-null input, the result is a null scalar (`is_valid()==false`), except for
+ * aggregations with a well-defined output for such input (e.g. `any` -> `false`, `all` -> `true`).
  *
  * If the input column is an arithmetic type, the `output_dtype` can be any arithmetic
  * type. If the input column is a non-arithmetic type (e.g. timestamp or string)

@@ -38,128 +38,170 @@
 namespace cudf {
 namespace reduction {
 namespace detail {
-struct reduce_dispatch_functor {
-  column_view const col;
-  data_type output_dtype;
-  std::optional<std::reference_wrapper<scalar const>> init;
-  rmm::device_async_resource_ref mr;
-  rmm::cuda_stream_view stream;
-
-  reduce_dispatch_functor(column_view col,
-                          data_type output_dtype,
-                          std::optional<std::reference_wrapper<scalar const>> init,
-                          rmm::cuda_stream_view stream,
-                          rmm::device_async_resource_ref mr)
-    : col(std::move(col)), output_dtype(output_dtype), init(init), mr(mr), stream(stream)
-  {
+namespace {
+
+/**
+ * @brief Dispatches a reduction to the implementation matching the aggregation kind
+ *
+ * Aggregation-specific options (e.g. ddof, quantiles, null handling) are read from the concrete
+ * aggregation type corresponding to `agg.kind`. The aggregation is only ever accessed through a
+ * const reference; it is never copied.
+ *
+ * Fails via `CUDF_EXPECTS`/`CUDF_FAIL` if the aggregation kind is not supported for reductions,
+ * if a QUANTILE aggregation holds more than one quantile, if a (MERGE_)TDIGEST aggregation is
+ * requested with a non-STRUCT `output_dtype`, or if a HOST_UDF aggregation does not hold a
+ * `reduce_host_udf` instance.
+ *
+ * @param agg The reduction aggregation to perform
+ * @param col The input column
+ * @param output_dtype The requested output type; forwarded only to the reductions that accept it
+ * @param init Optional initial value; forwarded only to SUM, PRODUCT, MIN, MAX, ANY, ALL and
+ * HOST_UDF
+ * @param stream CUDA stream forwarded to the reduction implementations
+ * @param mr Memory resource forwarded to the reduction implementations
+ * @return The scalar result of the reduction
+ */
+std::unique_ptr<scalar> reduce_aggregate_impl(
+  reduce_aggregation const& agg,
+  column_view col,
+  data_type output_dtype,
+  std::optional<std::reference_wrapper<scalar const>> init,
+  rmm::cuda_stream_view stream,
+  rmm::device_async_resource_ref mr)
+{
+  switch (agg.kind) {
+    case aggregation::SUM: return sum(col, output_dtype, init, stream, mr);
+    case aggregation::PRODUCT: return product(col, output_dtype, init, stream, mr);
+    case aggregation::MIN: return min(col, output_dtype, init, stream, mr);
+    case aggregation::MAX: return max(col, output_dtype, init, stream, mr);
+    case aggregation::ANY: return any(col, output_dtype, init, stream, mr);
+    case aggregation::ALL: return all(col, output_dtype, init, stream, mr);
+    case aggregation::HISTOGRAM: return histogram(col, stream, mr);
+    case aggregation::MERGE_HISTOGRAM: return merge_histogram(col, stream, mr);
+    case aggregation::SUM_OF_SQUARES: return sum_of_squares(col, output_dtype, stream, mr);
+    case aggregation::MEAN: return mean(col, output_dtype, stream, mr);
+    case aggregation::VARIANCE: {
+      auto const& var_agg = static_cast<cudf::detail::var_aggregation const&>(agg);
+      return variance(col, output_dtype, var_agg._ddof, stream, mr);
+    }
+    case aggregation::STD: {
+      auto const& std_agg = static_cast<cudf::detail::std_aggregation const&>(agg);
+      return standard_deviation(col, output_dtype, std_agg._ddof, stream, mr);
+    }
+    case aggregation::MEDIAN: {
+      // Intermediate results come from the current device resource; only the final scalar
+      // extraction uses `mr`.
+      auto current_mr = cudf::get_current_device_resource_ref();
+      auto sorted_indices =
+        cudf::detail::sorted_order(table_view{{col}}, {}, {null_order::AFTER}, stream, current_mr);
+      // Nulls are ordered last, so the leading `size - null_count` indices are the valid rows.
+      auto valid_sorted_indices =
+        cudf::detail::split(*sorted_indices, {col.size() - col.null_count()}, stream)[0];
+      auto col_ptr = cudf::detail::quantile(
+        col, {0.5}, interpolation::LINEAR, valid_sorted_indices, true, stream, current_mr);
+      return cudf::detail::get_element(*col_ptr, 0, stream, mr);
+    }
+    case aggregation::QUANTILE: {
+      auto const& quantile_agg = static_cast<cudf::detail::quantile_aggregation const&>(agg);
+      CUDF_EXPECTS(quantile_agg._quantiles.size() == 1,
+                   "Reduction quantile accepts only one quantile value");
+      // Intermediate results come from the current device resource; only the final scalar
+      // extraction uses `mr`.
+      auto current_mr = cudf::get_current_device_resource_ref();
+      auto sorted_indices =
+        cudf::detail::sorted_order(table_view{{col}}, {}, {null_order::AFTER}, stream, current_mr);
+      // Nulls are ordered last, so the leading `size - null_count` indices are the valid rows.
+      auto valid_sorted_indices =
+        cudf::detail::split(*sorted_indices, {col.size() - col.null_count()}, stream)[0];
+
+      auto col_ptr = cudf::detail::quantile(col,
+                                            quantile_agg._quantiles,
+                                            quantile_agg._interpolation,
+                                            valid_sorted_indices,
+                                            true,
+                                            stream,
+                                            current_mr);
+      return cudf::detail::get_element(*col_ptr, 0, stream, mr);
+    }
+    case aggregation::NUNIQUE: {
+      auto const& nunique_agg = static_cast<cudf::detail::nunique_aggregation const&>(agg);
+      return cudf::make_fixed_width_scalar(
+        cudf::detail::distinct_count(
+          col, nunique_agg._null_handling, nan_policy::NAN_IS_VALID, stream),
+        stream,
+        mr);
+    }
+    case aggregation::NTH_ELEMENT: {
+      auto const& nth_agg = static_cast<cudf::detail::nth_element_aggregation const&>(agg);
+      return nth_element(col, nth_agg._n, nth_agg._null_handling, stream, mr);
+    }
+    case aggregation::COLLECT_LIST: {
+      auto const& col_agg = static_cast<cudf::detail::collect_list_aggregation const&>(agg);
+      return collect_list(col, col_agg._null_handling, stream, mr);
+    }
+    case aggregation::COLLECT_SET: {
+      auto const& col_agg = static_cast<cudf::detail::collect_set_aggregation const&>(agg);
+      return collect_set(
+        col, col_agg._null_handling, col_agg._nulls_equal, col_agg._nans_equal, stream, mr);
+    }
+    case aggregation::MERGE_LISTS: {
+      return merge_lists(col, stream, mr);
+    }
+    case aggregation::MERGE_SETS: {
+      auto const& col_agg = static_cast<cudf::detail::merge_sets_aggregation const&>(agg);
+      return merge_sets(col, col_agg._nulls_equal, col_agg._nans_equal, stream, mr);
+    }
+    case aggregation::TDIGEST: {
+      CUDF_EXPECTS(output_dtype.id() == type_id::STRUCT,
+                   "Tdigest aggregations expect output type to be STRUCT");
+      auto const& td_agg = static_cast<cudf::detail::tdigest_aggregation const&>(agg);
+      return tdigest::detail::reduce_tdigest(col, td_agg.max_centroids, stream, mr);
+    }
+    case aggregation::MERGE_TDIGEST: {
+      CUDF_EXPECTS(output_dtype.id() == type_id::STRUCT,
+                   "Tdigest aggregations expect output type to be STRUCT");
+      auto const& td_agg = static_cast<cudf::detail::merge_tdigest_aggregation const&>(agg);
+      return tdigest::detail::reduce_merge_tdigest(col, td_agg.max_centroids, stream, mr);
+    }
+    case aggregation::HOST_UDF: {
+      auto const& udf_base_ptr =
+        dynamic_cast<cudf::detail::host_udf_aggregation const&>(agg).udf_ptr;
+      // The stored UDF must be a reduction UDF; any other host UDF flavor is rejected below.
+      auto const udf_ptr = dynamic_cast<reduce_host_udf const*>(udf_base_ptr.get());
+      CUDF_EXPECTS(udf_ptr != nullptr, "Invalid HOST_UDF instance for reduction.");
+      return (*udf_ptr)(col, output_dtype, init, stream, mr);
+    }  // case aggregation::HOST_UDF
+    case aggregation::BITWISE_AGG: {
+      auto const& bitwise_agg = static_cast<cudf::detail::bitwise_aggregation const&>(agg);
+      return bitwise_reduction(bitwise_agg.bit_op, col, stream, mr);
+    }
+    default: CUDF_FAIL("Unsupported reduction operator");
   }
+}
 
-  template <aggregation::Kind k>
-  std::unique_ptr<scalar> operator()(reduce_aggregation const& agg)
-  {
-    switch (k) {
-      case aggregation::SUM: return sum(col, output_dtype, init, stream, mr);
-      case aggregation::PRODUCT: return product(col, output_dtype, init, stream, mr);
-      case aggregation::MIN: return min(col, output_dtype, init, stream, mr);
-      case aggregation::MAX: return max(col, output_dtype, init, stream, mr);
-      case aggregation::ANY: return any(col, output_dtype, init, stream, mr);
-      case aggregation::ALL: return all(col, output_dtype, init, stream, mr);
-      case aggregation::HISTOGRAM: return histogram(col, stream, mr);
-      case aggregation::MERGE_HISTOGRAM: return merge_histogram(col, stream, mr);
-      case aggregation::SUM_OF_SQUARES: return sum_of_squares(col, output_dtype, stream, mr);
-      case aggregation::MEAN: return mean(col, output_dtype, stream, mr);
-      case aggregation::VARIANCE: {
-        auto var_agg = static_cast<cudf::detail::var_aggregation const&>(agg);
-        return variance(col, output_dtype, var_agg._ddof, stream, mr);
-      }
-      case aggregation::STD: {
-        auto var_agg = static_cast<cudf::detail::std_aggregation const&>(agg);
-        return standard_deviation(col, output_dtype, var_agg._ddof, stream, mr);
-      }
-      case aggregation::MEDIAN: {
-        auto current_mr     = cudf::get_current_device_resource_ref();
-        auto sorted_indices = cudf::detail::sorted_order(
-          table_view{{col}}, {}, {null_order::AFTER}, stream, current_mr);
-        auto valid_sorted_indices =
-          cudf::detail::split(*sorted_indices, {col.size() - col.null_count()}, stream)[0];
-        auto col_ptr = cudf::detail::quantile(
-          col, {0.5}, interpolation::LINEAR, valid_sorted_indices, true, stream, current_mr);
-        return cudf::detail::get_element(*col_ptr, 0, stream, mr);
-      }
-      case aggregation::QUANTILE: {
-        auto quantile_agg = static_cast<cudf::detail::quantile_aggregation const&>(agg);
-        CUDF_EXPECTS(quantile_agg._quantiles.size() == 1,
-                     "Reduction quantile accepts only one quantile value");
-        auto current_mr     = cudf::get_current_device_resource_ref();
-        auto sorted_indices = cudf::detail::sorted_order(
-          table_view{{col}}, {}, {null_order::AFTER}, stream, current_mr);
-        auto valid_sorted_indices =
-          cudf::detail::split(*sorted_indices, {col.size() - col.null_count()}, stream)[0];
-
-        auto col_ptr = cudf::detail::quantile(col,
-                                              quantile_agg._quantiles,
-                                              quantile_agg._interpolation,
-                                              valid_sorted_indices,
-                                              true,
-                                              stream,
-                                              current_mr);
-        return cudf::detail::get_element(*col_ptr, 0, stream, mr);
-      }
-      case aggregation::NUNIQUE: {
-        auto nunique_agg = static_cast<cudf::detail::nunique_aggregation const&>(agg);
-        return cudf::make_fixed_width_scalar(
-          cudf::detail::distinct_count(
-            col, nunique_agg._null_handling, nan_policy::NAN_IS_VALID, stream),
-          stream,
-          mr);
-      }
-      case aggregation::NTH_ELEMENT: {
-        auto nth_agg = static_cast<cudf::detail::nth_element_aggregation const&>(agg);
-        return nth_element(col, nth_agg._n, nth_agg._null_handling, stream, mr);
-      }
-      case aggregation::COLLECT_LIST: {
-        auto col_agg = static_cast<cudf::detail::collect_list_aggregation const&>(agg);
-        return collect_list(col, col_agg._null_handling, stream, mr);
-      }
-      case aggregation::COLLECT_SET: {
-        auto col_agg = static_cast<cudf::detail::collect_set_aggregation const&>(agg);
-        return collect_set(
-          col, col_agg._null_handling, col_agg._nulls_equal, col_agg._nans_equal, stream, mr);
-      }
-      case aggregation::MERGE_LISTS: {
-        return merge_lists(col, stream, mr);
-      }
-      case aggregation::MERGE_SETS: {
-        auto col_agg = static_cast<cudf::detail::merge_sets_aggregation const&>(agg);
-        return merge_sets(col, col_agg._nulls_equal, col_agg._nans_equal, stream, mr);
-      }
-      case aggregation::TDIGEST: {
-        CUDF_EXPECTS(output_dtype.id() == type_id::STRUCT,
-                     "Tdigest aggregations expect output type to be STRUCT");
-        auto td_agg = static_cast<cudf::detail::tdigest_aggregation const&>(agg);
-        return tdigest::detail::reduce_tdigest(col, td_agg.max_centroids, stream, mr);
-      }
-      case aggregation::MERGE_TDIGEST: {
-        CUDF_EXPECTS(output_dtype.id() == type_id::STRUCT,
-                     "Tdigest aggregations expect output type to be STRUCT");
-        auto td_agg = static_cast<cudf::detail::merge_tdigest_aggregation const&>(agg);
-        return tdigest::detail::reduce_merge_tdigest(col, td_agg.max_centroids, stream, mr);
-      }
-      case aggregation::HOST_UDF: {
-        auto const& udf_base_ptr =
-          dynamic_cast<cudf::detail::host_udf_aggregation const&>(agg).udf_ptr;
-        auto const udf_ptr = dynamic_cast<reduce_host_udf const*>(udf_base_ptr.get());
-        CUDF_EXPECTS(udf_ptr != nullptr, "Invalid HOST_UDF instance for reduction.");
-        return (*udf_ptr)(col, output_dtype, init, stream, mr);
-      }  // case aggregation::HOST_UDF
-      case aggregation::BITWISE_AGG: {
-        auto const bitwise_agg = static_cast<cudf::detail::bitwise_aggregation const&>(agg);
-        return bitwise_reduction(bitwise_agg.bit_op, col, stream, mr);
-      }
-      default: CUDF_FAIL("Unsupported reduction operator");
+/**
+ * @brief Specialized implementation for empty or all-null input
+ *
+ * This implementation is used to handle the case where the input column is empty or all null.
+ * It builds the result directly from the aggregation kind instead of dispatching to the regular
+ * reduction implementations:
+ *  - TDIGEST, MERGE_TDIGEST: an empty tdigest scalar
+ *  - HISTOGRAM, MERGE_HISTOGRAM: a valid list scalar holding an empty histogram
+ *  - COLLECT_LIST, COLLECT_SET: a list scalar marked invalid (null)
+ *  - ANY: valid `false`; ALL: valid `true`
+ *  - NUNIQUE: valid `1` for non-empty (all-null) input when nulls are included, otherwise a null
+ *    scalar
+ *  - any other kind: a default-constructed scalar of `output_dtype`, or an empty scalar like
+ *    `col` when `output_dtype` is a nested type
+ *
+ * @param agg The reduction operation to perform
+ * @param col The input column
+ * @param output_dtype The output data type
+ * @param stream The CUDA stream to use
+ * @param mr The memory resource to use
+ * @return A scalar with the appropriate value for the reduction operation
+ */
+std::unique_ptr<scalar> reduce_no_data_impl(reduce_aggregation const& agg,
+                                            column_view col,
+                                            data_type output_dtype,
+                                            rmm::cuda_stream_view stream,
+                                            rmm::device_async_resource_ref mr)
+{
+  switch (agg.kind) {
+    case aggregation::TDIGEST: [[fallthrough]];
+    case aggregation::MERGE_TDIGEST: return tdigest::detail::make_empty_tdigest_scalar(stream, mr);
+    case aggregation::HISTOGRAM:
+      return std::make_unique<list_scalar>(
+        std::move(*reduction::detail::make_empty_histogram_like(col)), true, stream, mr);
+    case aggregation::MERGE_HISTOGRAM:
+      // The empty histogram is modeled on the first child of the input column.
+      return std::make_unique<list_scalar>(
+        std::move(*reduction::detail::make_empty_histogram_like(col.child(0))), true, stream, mr);
+    case aggregation::COLLECT_LIST: [[fallthrough]];
+    case aggregation::COLLECT_SET: {
+      auto result = make_list_scalar(empty_like(col)->view(), stream, mr);
+      result->set_valid_async(false, stream);
+      return result;
+    }
+    case aggregation::ANY: [[fallthrough]];
+    case aggregation::ALL: {
+      // empty input should return false for ANY and return true for ALL
+      return std::make_unique<numeric_scalar<bool>>(agg.kind == aggregation::ALL, true, stream, mr);
+    }
+    case aggregation::NUNIQUE: {
+      auto const& nunique_agg = static_cast<cudf::detail::nunique_aggregation const&>(agg);
+      // A non-empty all-null column has exactly one distinct value (null). It is reported as a
+      // valid count only when nulls are included; otherwise, and for empty input, the scalar is
+      // null.
+      auto const has_rows = !col.is_empty();
+      auto const valid    = has_rows && (nunique_agg._null_handling == cudf::null_policy::INCLUDE);
+      return std::make_unique<numeric_scalar<size_type>>(
+        static_cast<size_type>(has_rows), valid, stream, mr);
+    }
+    default: {
+      // `make_default_constructed_scalar` does not support nested type.
+      return cudf::is_nested(output_dtype)
+               ? make_empty_scalar_like(col, stream, mr)
+               : make_default_constructed_scalar(output_dtype, stream, mr);
     }
   }
-};
+}
+}  // namespace
 
 std::unique_ptr<scalar> reduce(column_view const& col,
                                reduce_aggregation const& agg,
@@ -181,40 +223,9 @@ std::unique_ptr<scalar> reduce(column_view const& col,
   }
 
   // Returns default scalar if input column is empty or all null
-  if (col.size() <= col.null_count()) {
-    if (agg.kind == aggregation::TDIGEST || agg.kind == aggregation::MERGE_TDIGEST) {
-      return tdigest::detail::make_empty_tdigest_scalar(stream, mr);
-    }
-
-    if (agg.kind == aggregation::HISTOGRAM) {
-      return std::make_unique<list_scalar>(
-        std::move(*reduction::detail::make_empty_histogram_like(col)), true, stream, mr);
-    }
-    if (agg.kind == aggregation::MERGE_HISTOGRAM) {
-      return std::make_unique<list_scalar>(
-        std::move(*reduction::detail::make_empty_histogram_like(col.child(0))), true, stream, mr);
-    }
-
-    if (agg.kind == aggregation::COLLECT_LIST || agg.kind == aggregation::COLLECT_SET) {
-      auto scalar = make_list_scalar(empty_like(col)->view(), stream, mr);
-      scalar->set_valid_async(false, stream);
-      return scalar;
-    }
-
-    // `make_default_constructed_scalar` does not support nested type.
-    if (cudf::is_nested(output_dtype)) { return make_empty_scalar_like(col, stream, mr); }
-
-    auto result = make_default_constructed_scalar(output_dtype, stream, mr);
-    if (agg.kind == aggregation::ANY || agg.kind == aggregation::ALL) {
-      // empty input should return false for ANY and return true for ALL
-      dynamic_cast<numeric_scalar<bool>*>(result.get())
-        ->set_value(agg.kind == aggregation::ALL, stream);
-    }
-    return result;
-  }
-
-  return cudf::detail::aggregation_dispatcher(
-    agg.kind, reduce_dispatch_functor{col, output_dtype, init, stream, mr}, agg);
+  return (col.size() == col.null_count())
+           ? reduce_no_data_impl(agg, col, output_dtype, stream, mr)
+           : reduce_aggregate_impl(agg, col, output_dtype, init, stream, mr);
 }
 }  // namespace detail
 }  // namespace reduction

@@ -1120,6 +1120,15 @@ TEST_F(ReductionEmptyTest, empty_column)
   result = cudf::reduce(col_nulls, *all_agg, bool_type);
   EXPECT_EQ(result->is_valid(), true);
   EXPECT_EQ(dynamic_cast<cudf::numeric_scalar<bool>*>(result.get())->value(), true);
+
+  auto size_data_type = cudf::data_type(cudf::type_to_id<cudf::size_type>());
+  auto nunique_agg =
+    cudf::make_nunique_aggregation<cudf::reduce_aggregation>(cudf::null_policy::INCLUDE);
+  result = cudf::reduce(col0, *nunique_agg, size_data_type);
+  EXPECT_EQ(result->is_valid(), false);
+  result = cudf::reduce(col_nulls, *nunique_agg, size_data_type);
+  EXPECT_EQ(result->is_valid(), true);
+  EXPECT_EQ(dynamic_cast<cudf::numeric_scalar<cudf::size_type>*>(result.get())->value(), 1);
 }
 
 // ----------------------------------------------------------------------------