NVIDIA · wjxiz1992 · Apr 16, 2026 · Apr 17, 2026 · Apr 17, 2026 · Apr 17, 2026
diff --git a/src/main/cpp/CMakeLists.txt b/src/main/cpp/CMakeLists.txt
@@ -202,6 +202,7 @@ add_library(
   src/KudoGpuSerializerJni.cpp
   src/ListSliceJni.cpp
   src/MapJni.cpp
+  src/MapUtilsJni.cpp
   src/MapZipWithUtilsJNI.cpp
   src/JoinPrimitivesJni.cpp
   src/NativeParquetJni.cpp
@@ -252,6 +253,7 @@ add_library(
   src/join_primitives.cu
   src/list_slice.cu
   src/map.cu
+  src/map_utils.cpp
   src/map_zip_with_utils.cu
   src/multiply.cu
   src/number_converter.cu

diff --git a/src/main/cpp/src/MapUtilsJni.cpp b/src/main/cpp/src/MapUtilsJni.cpp
@@ -0,0 +1,37 @@
+/*
+ * Copyright (c) 2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+#include "cudf_jni_apis.hpp"
+#include "jni_utils.hpp"
+#include "map_utils.hpp"
+
+extern "C" {
+
+JNIEXPORT jlong JNICALL Java_com_nvidia_spark_rapids_jni_MapUtils_mapFromEntries(
+  JNIEnv* env, jclass, jlong input_handle, jboolean throw_on_null_key)
+{
+  JNI_NULL_CHECK(env, input_handle, "input column is null", 0);
+  JNI_TRY
+  {
+    cudf::jni::auto_set_device(env);
+    auto const& input = *reinterpret_cast<cudf::column_view const*>(input_handle);
+    return cudf::jni::release_as_jlong(
+      spark_rapids_jni::map_from_entries(input, static_cast<bool>(throw_on_null_key)));
+  }
+  JNI_CATCH(env, 0);
+}
+
+}  // extern "C"
diff --git a/src/main/cpp/src/map_utils.cpp b/src/main/cpp/src/map_utils.cpp
@@ -0,0 +1,248 @@
+/*
+ * Copyright (c) 2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+#include "map_utils.hpp"
+
+#include "nvtx_ranges.hpp"
+
+#include <cudf/aggregation.hpp>
+#include <cudf/binaryop.hpp>
+#include <cudf/column/column.hpp>
+#include <cudf/column/column_factories.hpp>
+#include <cudf/copying.hpp>
+#include <cudf/lists/contains.hpp>
+#include <cudf/lists/lists_column_view.hpp>
+#include <cudf/null_mask.hpp>
+#include <cudf/reduction.hpp>
+#include <cudf/scalar/scalar.hpp>
+#include <cudf/transform.hpp>
+#include <cudf/unary.hpp>
+#include <cudf/utilities/default_stream.hpp>
+#include <cudf/utilities/error.hpp>
+#include <cudf/utilities/memory_resource.hpp>
+#include <cudf/utilities/span.hpp>
+
+#include <rmm/cuda_stream_view.hpp>
+#include <rmm/device_buffer.hpp>
+#include <rmm/resource_ref.hpp>
+
+#include <vector>
+
+namespace spark_rapids_jni {
+
+namespace {
+// Extract a bool from a BOOL8 reduce scalar; returns false if scalar is null (empty-column case).
+// Each of is_valid(stream) and value(stream) performs a blocking device→host copy.
+// Two syncs per call; acceptable because the scalar is small and syncs are rare.
+auto bool_scalar_value(std::unique_ptr<cudf::scalar> const& s, rmm::cuda_stream_view stream) -> bool
+{
+  return s->is_valid(stream) &&
+         static_cast<cudf::numeric_scalar<bool> const*>(s.get())->value(stream);
+}
+
+// Reduce a BOOL8 column to a single bool via ANY aggregation.
+// Returns false when the column is empty (scalar is null).
+auto reduce_any(cudf::column_view const& col,
+                rmm::cuda_stream_view stream,
+                rmm::device_async_resource_ref mr) -> bool
+{
+  auto s = cudf::reduce(col,
+                        *cudf::make_any_aggregation<cudf::reduce_aggregation>(),
+                        cudf::data_type{cudf::type_id::BOOL8},
+                        stream,
+                        mr);
+  return bool_scalar_value(s, stream);
+}
+
+// Error message used by both fast-path and slow-path null-key checks.
+constexpr char null_key_error[] = "Cannot use null as map key.";
+
+// Returns true iff any row has a null-key entry AND passes the per-row guard.
+// Shared by fast path (guard = is_valid(input)) and slow path (guard = no_null_entry):
+//   1. segmented_reduce(MAX) over the per-entry null-key flags → per-row row_has_null_key
+//   2. row_has_null_key AND guard → row_throw
+//   3. reduce_any(row_throw) → final bool
+auto any_null_key_in_guarded_row(cudf::column_view const& entry_is_null_key,
+                                 cudf::device_span<cudf::size_type const> offsets_span,
+                                 cudf::column_view const& guard,
+                                 rmm::cuda_stream_view stream,
+                                 rmm::device_async_resource_ref mr) -> bool
+{
+  auto row_has_null_key =
+    cudf::segmented_reduce(entry_is_null_key,
+                           offsets_span,
+                           *cudf::make_max_aggregation<cudf::segmented_reduce_aggregation>(),
+                           cudf::data_type{cudf::type_id::BOOL8},
+                           cudf::null_policy::EXCLUDE,
+                           stream,
+                           mr);
+  auto row_throw = cudf::binary_operation(*row_has_null_key,
+                                          guard,
+                                          cudf::binary_operator::LOGICAL_AND,
+                                          cudf::data_type{cudf::type_id::BOOL8},
+                                          stream,
+                                          mr);
+  return reduce_any(*row_throw, stream, mr);
+}
+}  // namespace
+
+std::unique_ptr<cudf::column> map_from_entries(cudf::column_view const& input,
+                                               bool throw_on_null_key,
+                                               rmm::cuda_stream_view stream,
+                                               rmm::device_async_resource_ref mr)
+{
+  SRJ_FUNC_RANGE();
+  CUDF_EXPECTS(input.type().id() == cudf::type_id::LIST,
+               "map_from_entries: input must be a LIST column");
+
+  // Validate the nested child shape before the zero-row early return so the documented
+  // LIST(STRUCT(KEY, VALUE)) contract is enforced uniformly — an empty LIST<non-STRUCT>
+  // or LIST<STRUCT<wrong arity>> would otherwise slip through without error.
+  auto const lists_cv = cudf::lists_column_view(input);
+  auto const structs  = lists_cv.child();
+  CUDF_EXPECTS(structs.type().id() == cudf::type_id::STRUCT,
+               "map_from_entries: list child must be a STRUCT column");
+  CUDF_EXPECTS(structs.num_children() == 2,
+               "map_from_entries: struct must have exactly 2 children (KEY, VALUE)");
+
+  if (input.size() == 0) { return cudf::empty_like(input); }
+
+  // Use the default resource for all temporaries; only the output column uses mr.
+  auto const temp_mr = cudf::get_current_device_resource_ref();
+
+  // Per-row flag: does row i contain any null struct entry?
+  // contains_nulls returns BOOL8 of size input.size(); null for outer-null rows.
+  auto has_null_entry = cudf::lists::contains_nulls(lists_cv, stream, temp_mr);
+
+  // Slice-correct offsets span: covers exactly the visible rows of this (potentially sliced)
+  // input. offsets_begin() accounts for input.offset(), so the span is valid for sliced columns.
+  auto const offsets_span = cudf::device_span<cudf::size_type const>(
+    lists_cv.offsets_begin(), static_cast<std::size_t>(input.size()) + 1);
+
+  // Fast path: no null struct entries anywhere — simple global null-key check.
+  bool const any_null_entry = reduce_any(*has_null_entry, stream, temp_mr);
+
+  if (!any_null_entry) {
+    // All struct entries are valid. Use segmented_reduce over the slice-correct offsets to
+    // check for null keys — structs.child(0) is the un-sliced underlying column, so
+    // keys.null_count() would count nulls outside the visible slice range.
+    // Outer-null LIST rows satisfy cudf's invariant of empty child segments
+    // (offsets[i]==offsets[i+1]), so they contribute zero keys to the child column and cannot
+    // inflate null_count().
+    //
+    // SAFETY: keys is structs.child(0) from a cudf lists column; any column constructed via the
+    // public cudf API has a materialized null_count (not UNKNOWN_NULL_COUNT), so null_count()
+    // here is a concrete integer — a sentinel value would indicate a cudf bug, not a case we
+    // need to guard against.
+    auto const keys = structs.child(0);
+    if (throw_on_null_key && keys.nullable() && keys.null_count() > 0) {
+      // Guard is is_valid(input): outer-null rows must not trigger a throw.
+      auto key_is_null    = cudf::is_null(keys, stream, temp_mr);
+      auto input_is_valid = cudf::is_valid(input, stream, temp_mr);
+      if (any_null_key_in_guarded_row(
+            *key_is_null, offsets_span, *input_is_valid, stream, temp_mr)) {
+        throw cudf::logic_error(null_key_error);
+      }
+    }
+    return std::make_unique<cudf::column>(input, stream, mr);
+  }
+
+  // Slow path: at least one row contains a null struct entry.
+  //
+  // CPU semantics: if a row's array has any null struct entry the entire output row is null,
+  // regardless of whether another entry in that row also has a null key.  We must therefore
+  // throw "Cannot use null as map key" only for rows that satisfy BOTH:
+  //   (a) the row has NO null struct entry  (has_null_entry = false), AND
+  //   (b) at least one entry's key is null inside a valid (non-null) struct.
+  //
+  // NOT(has_null_entry): true for rows whose struct entries are all valid.
+  // Used as both the throw guard and the output null mask.  bools_to_mask treats NULL inputs
+  // as false, so outer-null rows (where has_null_entry is null) are correctly masked to null
+  // in the output.
+  auto no_null_entry =
+    cudf::unary_operation(*has_null_entry, cudf::unary_operator::NOT, stream, temp_mr);
+
+  // Throw only when: row has no null struct entry AND row has a null key.  For rows that
+  // contain a null struct entry the guard is false, so their entries are ignored; we also
+  // don't need to mask null-struct positions out of key_is_null before the segmented reduce
+  // because the per-row guard short-circuits any contribution from those rows.
+  // Gate on keys.nullable() && keys.null_count() > 0 to mirror the fast-path guard — when
+  // the key column has no nulls there is no throw to perform, so the BOOL8 alloc + kernel
+  // launches + device→host syncs can be skipped entirely.
+  if (throw_on_null_key) {
+    auto const keys = structs.child(0);
+    if (keys.nullable() && keys.null_count() > 0) {
+      auto key_is_null = cudf::is_null(keys, stream, temp_mr);
+      if (any_null_key_in_guarded_row(
+            *key_is_null, offsets_span, *no_null_entry, stream, temp_mr)) {
+        throw cudf::logic_error(null_key_error);
+      }
+    }
+  }
+
+  // Build null mask from no_null_entry: false/null → bit=0 (null), true → bit=1 (valid).
+  auto [entry_mask_uptr, entry_nc] = cudf::bools_to_mask(*no_null_entry, stream, temp_mr);
+
+  // Since any_null_entry == true, no_null_entry has at least one false/null bit, so entry_nc > 0.
+  CUDF_EXPECTS(
+    entry_nc > 0,
+    "map_from_entries: reached slow path with entry_nc == 0 — fast path invariant broken");
+
+  // Combine input's existing null mask with entry_mask via the offset-aware raw-bitmask overload
+  // so input.null_mask() is consumed from input.offset() while entry_mask starts at bit 0.
+  // The resulting combined_mask_buf is always bit-0-aligned for input.size() rows.
+  auto const entry_mask_ptr = static_cast<cudf::bitmask_type const*>(entry_mask_uptr->data());
+  std::vector<cudf::bitmask_type const*> masks;
+  std::vector<cudf::size_type> begin_bits;
+  if (input.nullable()) {
+    masks.push_back(input.null_mask());
+    begin_bits.push_back(input.offset());
+  }
+  masks.push_back(entry_mask_ptr);
+  begin_bits.push_back(0);
+  auto [combined_mask_buf, combined_nc] =
+    cudf::bitmask_and(cudf::host_span<cudf::bitmask_type const* const>{masks.data(), masks.size()},
+                      cudf::host_span<cudf::size_type const>{begin_bits.data(), begin_bits.size()},
+                      input.size(),
+                      stream,
+                      temp_mr);
+  auto const* mask_ptr = static_cast<cudf::bitmask_type const*>(combined_mask_buf.data());
+
+  // combined_mask_buf stores valid bits starting at bit 0 for input.size() rows, so
+  // result_view must use offset=0. For sliced input, slice the offsets child to start at
+  // input.offset() so list row ranges remain correct with the new zero offset.
+  auto const raw_offsets    = input.child(cudf::lists_column_view::offsets_column_index);
+  auto const sliced_offsets = cudf::column_view(raw_offsets.type(),
+                                                input.size() + 1,
+                                                raw_offsets.head<void>(),
+                                                nullptr,
+                                                0,
+                                                raw_offsets.offset() + input.offset());
+
+  auto const result_view =
+    cudf::column_view(input.type(),
+                      input.size(),
+                      nullptr,
+                      mask_ptr,
+                      combined_nc,
+                      /*offset=*/0,
+                      {sliced_offsets, input.child(cudf::lists_column_view::child_column_index)});
+  // purge_nonempty_nulls adjusts list offsets so each null outer row has an empty span,
+  // satisfying cudf's invariant that null rows in nested columns are empty.
+  return cudf::purge_nonempty_nulls(result_view, stream, mr);
+}
+
+}  // namespace spark_rapids_jni
diff --git a/src/main/cpp/src/map_utils.hpp b/src/main/cpp/src/map_utils.hpp
@@ -0,0 +1,62 @@
+/*
+ * Copyright (c) 2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+#pragma once
+
+#include <cudf/column/column_view.hpp>
+#include <cudf/utilities/default_stream.hpp>
+#include <cudf/utilities/memory_resource.hpp>
+
+#include <rmm/cuda_stream_view.hpp>
+
+#include <memory>
+
+namespace spark_rapids_jni {
+
+/**
+ * @brief Converts a LIST(STRUCT(KEY, VALUE)) column to a map column following Spark semantics.
+ *
+ * Spark semantics for map_from_entries:
+ *  - If a row's array contains any null struct entry (the whole struct is null), the output row
+ *    is null — even if another entry in that same row has a null key.
+ *  - If a row's array contains no null struct entry but does contain a null key inside a valid
+ *    struct, behavior depends on throw_on_null_key:
+ *      - true  → throws a logic_error ("Cannot use null as map key.")
+ *      - false → returns the row as-is (caller is responsible for deduplication policy)
+ *
+ * This function only handles null-struct masking and null-key validation.
+ * Duplicate-key deduplication is left to the caller.
+ *
+ * Sliced inputs are supported: only rows in the range
+ * `[input.offset(), input.offset() + input.size())` are inspected.
+ *
+ * @throws cudf::logic_error if the input is not a LIST(STRUCT(KEY,...)) column.
+ * @throws cudf::logic_error if @p throw_on_null_key is true and any row (with no null struct
+ *         entries) contains a null key inside a valid struct.
+ * @param input           Input LIST(STRUCT(KEY, VALUE)) column.
+ * @param throw_on_null_key  When true, throw if any valid-struct entry has a null key.
+ * @param stream          CUDA stream used for device memory operations and kernel launches.
+ * @param mr              Device memory resource used to allocate the returned column's memory.
+ * @return A new column equal to @p input except that rows containing null struct entries are
+ *         replaced with a null outer row.
+ */
+[[nodiscard]] std::unique_ptr<cudf::column> map_from_entries(
+  cudf::column_view const& input,
+  bool throw_on_null_key,
+  rmm::cuda_stream_view stream      = cudf::get_default_stream(),
+  rmm::device_async_resource_ref mr = cudf::get_current_device_resource_ref());
+
+}  // namespace spark_rapids_jni
diff --git a/src/main/cpp/tests/CMakeLists.txt b/src/main/cpp/tests/CMakeLists.txt
@@ -113,6 +113,9 @@ ConfigureTest(LIST_SLICE
 ConfigureTest(MAP_ZIP_WITH
     map_zip_with_utils.cpp)
 
+ConfigureTest(MAP_UTILS
+    map_utils.cpp)
+
 ConfigureTest(SUBSTRING_INDEX
     substring_index.cpp)