Skip to content

Commit 010152d

Browse files
committed
Merge branch 'branch-25.12' into change_jni_try_catch
2 parents 3ecee0b + 2eecac2 commit 010152d

35 files changed

+897
-88
lines changed

.github/workflows/shell-check.yml

Lines changed: 41 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,41 @@
1+
# Copyright (c) 2025, NVIDIA CORPORATION.
2+
#
3+
# Licensed under the Apache License, Version 2.0 (the "License");
4+
# you may not use this file except in compliance with the License.
5+
# You may obtain a copy of the License at
6+
#
7+
# http://www.apache.org/licenses/LICENSE-2.0
8+
#
9+
# Unless required by applicable law or agreed to in writing, software
10+
# distributed under the License is distributed on an "AS IS" BASIS,
11+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12+
# See the License for the specific language governing permissions and
13+
# limitations under the License.
14+
15+
# A workflow to check shell script syntax
16+
name: shell check
17+
18+
on:
19+
pull_request:
20+
types: [opened, synchronize, reopened]
21+
22+
jobs:
23+
shell-check:
24+
runs-on: ubuntu-latest
25+
if: "!contains(github.event.pull_request.title, '[bot]')"
26+
steps:
27+
- name: Checkout code
28+
uses: NVIDIA/spark-rapids-common/checkout@main
29+
30+
- name: Run ShellCheck
31+
uses: NVIDIA/spark-rapids-common/shell-check@main
32+
with:
33+
excluded_codes:
34+
SC3010,
35+
SC2054,
36+
SC2124
37+
# code explanation:
38+
# SC3010: In POSIX sh, [[ ]] is undefined.
39+
# SC2054: Use spaces, not commas, to separate array elements.
40+
# SC2124: Assigning an array to a string! Assign as array, or use * instead of @ to concatenate.
41+

.gitmodules

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
11
[submodule "thirdparty/cudf"]
22
path = thirdparty/cudf
33
url = https://github.com/rapidsai/cudf.git
4-
branch = branch-25.10
4+
branch = branch-25.12

CONTRIBUTING.md

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -165,7 +165,7 @@ $ ./build/build-in-docker install ...
165165
```
166166

167167
Now cd to ~/repos/NVIDIA/spark-rapids and build with one of the options from
168-
[spark-rapids instructions](https://github.com/NVIDIA/spark-rapids/blob/branch-25.10/CONTRIBUTING.md#building-from-source).
168+
[spark-rapids instructions](https://github.com/NVIDIA/spark-rapids/blob/branch-25.12/CONTRIBUTING.md#building-from-source).
169169

170170
```bash
171171
$ ./build/buildall

build/apply-patches

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,7 @@
11
#!/bin/bash
22

33
#
4-
# Copyright (c) 2024, NVIDIA CORPORATION. All rights reserved.
4+
# Copyright (c) 2024-2025, NVIDIA CORPORATION. All rights reserved.
55
#
66
# Licensed under the Apache License, Version 2.0 (the "License");
77
# you may not use this file except in compliance with the License.
@@ -51,7 +51,7 @@ fi
5151

5252
CHANGED_FILES=$(git status --porcelain --untracked-files=no)
5353

54-
if [ \( -s "$FULLY_PATCHED_FILE" \) -a \( -n "$CHANGED_FILES" \) ] ; then
54+
if [ -s "$FULLY_PATCHED_FILE" ] && [ -n "$CHANGED_FILES" ] ; then
5555
if git apply -R --check "$FULLY_PATCHED_FILE" ; then
5656
echo "Patches appear to have been applied already"
5757
exit 0
@@ -60,7 +60,7 @@ fi
6060

6161
if [ -n "$CHANGED_FILES" ] ; then
6262
echo "Error: CUDF repository has uncommitted changes. No patches will be applied. Please clean the repository so we can try and add the needed patches"
63-
echo "$CHANGED_FILE"
63+
echo "$CHANGED_FILES"
6464
exit 1
6565
fi
6666

build/run-in-docker

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -89,7 +89,7 @@ if [[ "$HOST_CUDA_PATH" != "" ]]; then
8989
RO_DST+=("/usr/local/cuda")
9090
fi
9191
for (( i=0; i<${#RO_SRC[@]}; i++)); do
92-
MNT_ARGS+=(--mount type=bind,src=${RO_SRC[$i]},dst=${RO_DST[$i]},ro)
92+
MNT_ARGS+=(--mount "type=bind,src=${RO_SRC[$i]},dst=${RO_DST[$i]},ro")
9393
done
9494

9595
RW_SRC=(
@@ -99,11 +99,11 @@ RW_SRC=(
9999
"$LOCAL_MAVEN_REPO"
100100
)
101101
for (( i=0; i<${#RW_SRC[@]}; i++)); do
102-
MNT_ARGS+=(--mount type=bind,src=${RW_SRC[$i]},dst=${RW_SRC[$i]})
102+
MNT_ARGS+=(--mount "type=bind,src=${RW_SRC[$i]},dst=${RW_SRC[$i]}")
103103
done
104104

105105
$DOCKER_CMD run $DOCKER_GPU_OPTS $DOCKER_RUN_EXTRA_ARGS -u $(id -u):$(id -g) --rm \
106-
${MNT_ARGS[@]} \
106+
"${MNT_ARGS[@]}" \
107107
--workdir "$WORKDIR" \
108108
-e CCACHE_DIR="$LOCAL_CCACHE_DIR" \
109109
-e CMAKE_C_COMPILER_LAUNCHER="ccache" \

build/unapply-patches

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,7 @@
11
#!/bin/bash
22

33
#
4-
# Copyright (c) 2024, NVIDIA CORPORATION. All rights reserved.
4+
# Copyright (c) 2024-2025, NVIDIA CORPORATION. All rights reserved.
55
#
66
# Licensed under the Apache License, Version 2.0 (the "License");
77
# you may not use this file except in compliance with the License.
@@ -51,7 +51,7 @@ fi
5151

5252
CHANGED_FILES=$(git status --porcelain --untracked-files=no)
5353

54-
if [ \( -s "$FULLY_PATCHED_FILE" \) -a \( -n "$CHANGED_FILES" \) ] ; then
54+
if [ -s "$FULLY_PATCHED_FILE" ] && [ -n "$CHANGED_FILES" ] ; then
5555
if git apply --check -R "$FULLY_PATCHED_FILE"; then
5656
echo "Patches appear to have been applied, so going to remove them"
5757
git apply -R -v "$FULLY_PATCHED_FILE"
@@ -66,14 +66,14 @@ if [ \( -s "$FULLY_PATCHED_FILE" \) -a \( -n "$CHANGED_FILES" \) ] ; then
6666

6767
exit 0
6868
else
69-
echo "Files are changed, but in a way where the full path file does not apply to remove them $FULL_PATCHED_FILE"
69+
echo "Files are changed, but in a way where the full path file does not apply to remove them $FULLY_PATCHED_FILE"
7070
exit 1
7171
fi
7272
fi
7373

7474
if [ -n "$CHANGED_FILES" ] ; then
7575
echo "Error: CUDF repository has uncommitted changes, but does not appear to have been patched. Please clean it and try again."
76-
echo "$CHANGED_FILE"
76+
echo "$CHANGED_FILES"
7777
exit 1
7878
else
7979
echo "No changes in CUDF repository to remove"

ci/Jenkinsfile.premerge

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -31,7 +31,7 @@ import ipp.blossom.*
3131
def githubHelper // blossom github helper
3232
def TEMP_IMAGE_BUILD = true
3333
def IMAGE_PREMERGE_CU12 = "${common.ARTIFACTORY_NAME}/sw-spark-docker/plugin-jni:rockylinux8-cuda12.9.1-blossom"
34-
def IMAGE_PREMERGE_CU13 = "${common.ARTIFACTORY_NAME}/sw-spark-docker/plugin-jni:rockylinux8-cuda13.0.0-blossom"
34+
def IMAGE_PREMERGE_CU13 = "${common.ARTIFACTORY_NAME}/sw-spark-docker/plugin-jni:rockylinux8-cuda13.0.1-blossom"
3535
def cpuImage = pod.getCPUYAML(IMAGE_PREMERGE_CU12)
3636
def PREMERGE_DOCKERFILE = 'ci/Dockerfile'
3737
def PREMERGE_TAG_CU12
@@ -162,7 +162,7 @@ git --no-pager diff --name-only HEAD \$BASE -- ${PREMERGE_DOCKERFILE} || true"""
162162
"--network=host -f ${PREMERGE_DOCKERFILE} -t $IMAGE_PREMERGE_CU12 .")
163163
uploadDocker(IMAGE_PREMERGE_CU12)
164164
docker.build(IMAGE_PREMERGE_CU13,
165-
"--network=host -f ${PREMERGE_DOCKERFILE} -t $IMAGE_PREMERGE_CU13 --build-arg CUDA_VERSION=13.0.0 .")
165+
"--network=host -f ${PREMERGE_DOCKERFILE} -t $IMAGE_PREMERGE_CU13 --build-arg CUDA_VERSION=13.0.1 .")
166166
uploadDocker(IMAGE_PREMERGE_CU13)
167167
}
168168
}
@@ -214,7 +214,7 @@ git --no-pager diff --name-only HEAD \$BASE -- ${PREMERGE_DOCKERFILE} || true"""
214214
kubernetes {
215215
label "cu12-${BUILD_TAG}"
216216
cloud "${common.CLOUD_NAME}"
217-
yaml pod.getGPUYAMLwithVolume("${IMAGE_PREMERGE_CU12}", "${env.GPU_RESOURCE}", "${PVC}", "${PVC_MOUNT_PATH}", '10', '38Gi')
217+
yaml pod.getGPUYAMLwithVolume("${IMAGE_PREMERGE_CU12}", "${env.GPU_RESOURCE}", "${PVC}", "${PVC_MOUNT_PATH}", '10', '48Gi')
218218
customWorkspace "${CUSTOM_WORKSPACE}-cu12"
219219
}
220220
}
@@ -247,7 +247,7 @@ git --no-pager diff --name-only HEAD \$BASE -- ${PREMERGE_DOCKERFILE} || true"""
247247
kubernetes {
248248
label "cu13-${BUILD_TAG}"
249249
cloud "${common.CLOUD_NAME}"
250-
yaml pod.getGPUYAMLwithVolume("${IMAGE_PREMERGE_CU13}", "${env.GPU_RESOURCE}", "${PVC}", "${PVC_MOUNT_PATH}", '10', '38Gi', '580.65.06')
250+
yaml pod.getGPUYAMLwithVolume("${IMAGE_PREMERGE_CU13}", "${env.GPU_RESOURCE}", "${PVC}", "${PVC_MOUNT_PATH}", '10', '48Gi', '580.82.07')
251251
customWorkspace "${CUSTOM_WORKSPACE}-cu13"
252252
}
253253
}

ci/deploy.sh

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
11
#!/bin/bash
22
#
3-
# Copyright (c) 2022-2024, NVIDIA CORPORATION. All rights reserved.
3+
# Copyright (c) 2022-2025, NVIDIA CORPORATION. All rights reserved.
44
#
55
# Licensed under the Apache License, Version 2.0 (the "License");
66
# you may not use this file except in compliance with the License.
@@ -82,7 +82,7 @@ if [ "$SIGN_FILE" == true ]; then
8282
*)
8383
echo "Error unsupported sign type : $SIGN_TYPE !"
8484
echo "Please set variable SIGN_TOOL 'nvsec'or 'gpg'"
85-
exit -1
85+
exit 255
8686
;;
8787
esac
8888
else

docs/memory_management.md

Lines changed: 6 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -55,7 +55,11 @@ The selected thread transitions its state to `THREAD_SPLIT_THROW` and throws an
5555

5656
### Dedicated Threads vs. Pool Threads
5757

58-
From the view of the OOM state machine, each task has one or more "dedicated threads", along with zero or more "pool threads". When checking whether a task is blocked, OOM state machine is lenient on dedicated threads (only require any one of the dedicated threads to be blocked), but stringent on pool threads (all pool threads must be blocked). Being treated leniently is not always a good thing, it increases the chance of being mistakenly identified as a block task, thus causing unnecessary deadlock resolution. So we don't want a thread to be treated as a dedicated thread unless it is really necessary. There are two ways of avoiding a thread being treated as a dedicated thread:
58+
From the view of the OOM state machine, each task has one or more "dedicated threads", along with zero or more "pool threads" (background threads). When checking whether a task is blocked, the OOM state machine is lenient on dedicated threads (it only requires any one of the dedicated threads to be blocked), but stringent on pool threads (all pool threads must be blocked). Being treated leniently is not always a good thing: it increases the chance of the task being mistakenly identified as a blocked task, thus causing unnecessary deadlock resolution. So we don't want a thread to be treated as a dedicated thread unless it is really necessary. There are two ways of avoiding a thread being treated as a dedicated thread:
5959

6060
1. Avoid calling TaskContext.setTaskContext() in the current thread, this will prevent OOM state machine connecting the current thread to the task as a dedicated thread.
61-
2. If you have to set TaskContext, then it's also a good idea to proactively register thread itself as a pool thread instead of a dedicated thread. An example can be found [here](https://github.com/NVIDIA/spark-rapids/blob/c39f6a6004b0cf684ca526172e87b2bd4481eb3a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuOrcScan.scala#L2056) for registering threads.
61+
2. Proactively register thread itself as a pool thread instead of a dedicated thread. An example can be found [here](https://github.com/NVIDIA/spark-rapids/blob/c39f6a6004b0cf684ca526172e87b2bd4481eb3a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuOrcScan.scala#L2056) for registering threads. (Don't forget to unregister the thread when it is done.)
62+
63+
In most cases, we recommend the second approach, because typically the main task thread and the background thread form a producer-consumer relationship. The main task thread, acting as the consumer, will typically wait for the background thread to produce data. If we choose approach 1, then while the consumer is waiting its Java thread state will be `WAITING`, and even if the producer is actively working (so the whole task should NOT be considered blocked), the OOM state machine will mistakenly consider it a blocked task: because it cannot find any "pool thread" connected with this task, the condition "has at least one dedicated thread blocked on memory allocation, and all of the pool threads working on that task are also blocked" vacuously stands (there are no pool threads that could be non-blocked).
64+
65+
However, if we choose approach 2, then the OOM state machine will find at least one pool thread that is NOT blocked, so the condition "has at least one dedicated thread blocked on memory allocation, and all of the pool threads working on that task are also blocked" does NOT stand, and the task will NOT be considered blocked.

pom.xml

Lines changed: 19 additions & 32 deletions
Original file line numberDiff line numberDiff line change
@@ -21,7 +21,7 @@
2121

2222
<groupId>com.nvidia</groupId>
2323
<artifactId>spark-rapids-jni</artifactId>
24-
<version>25.10.0-SNAPSHOT</version>
24+
<version>25.12.0-SNAPSHOT</version>
2525
<packaging>jar</packaging>
2626
<name>RAPIDS Accelerator JNI for Apache Spark</name>
2727
<description>
@@ -95,6 +95,7 @@
9595
<jni.classifier>${cuda.version}</jni.classifier>
9696
<cudf.path>${project.basedir}/thirdparty/cudf</cudf.path>
9797
<cudf.pin.path>${project.basedir}/thirdparty/cudf-pins/</cudf.pin.path>
98+
<guava.version>14.0.1</guava.version>
9899
<hadoop.version>3.4.0</hadoop.version>
99100
<junit.version>5.8.1</junit.version>
100101
<libcudf.build.path>${project.build.directory}/libcudf/cmake-build/</libcudf.build.path>
@@ -122,26 +123,28 @@
122123

123124
<dependencies>
124125
<dependency>
125-
<groupId>org.apache.arrow</groupId>
126-
<artifactId>arrow-vector</artifactId>
127-
<version>${arrow.version}</version>
128-
<scope>test</scope>
126+
<groupId>org.apache.hadoop</groupId>
127+
<artifactId>hadoop-client-api</artifactId>
128+
<version>${hadoop.version}</version>
129+
<scope>provided</scope>
129130
</dependency>
130131
<dependency>
131132
<groupId>org.apache.hadoop</groupId>
132-
<artifactId>hadoop-common</artifactId>
133+
<artifactId>hadoop-client-runtime</artifactId>
133134
<version>${hadoop.version}</version>
134135
<scope>test</scope>
135-
<exclusions>
136-
<exclusion>
137-
<groupId>org.slf4j</groupId>
138-
<artifactId>slf4j-reload4j</artifactId>
139-
</exclusion>
140-
<exclusion>
141-
<groupId>org.slf4j</groupId>
142-
<artifactId>slf4j-log4j12</artifactId>
143-
</exclusion>
144-
</exclusions>
136+
</dependency>
137+
<dependency>
138+
<groupId>com.google.guava</groupId>
139+
<artifactId>guava</artifactId>
140+
<version>${guava.version}</version>
141+
<scope>test</scope>
142+
</dependency>
143+
<dependency>
144+
<groupId>org.apache.arrow</groupId>
145+
<artifactId>arrow-vector</artifactId>
146+
<version>${arrow.version}</version>
147+
<scope>test</scope>
145148
</dependency>
146149
<dependency>
147150
<groupId>org.apache.parquet</groupId>
@@ -190,22 +193,6 @@
190193
<version>${hilbert.version}</version>
191194
<scope>test</scope>
192195
</dependency>
193-
<dependency>
194-
<groupId>org.apache.hadoop</groupId>
195-
<artifactId>hadoop-mapreduce-client-core</artifactId>
196-
<version>${hadoop.version}</version>
197-
<scope>test</scope>
198-
<exclusions>
199-
<exclusion>
200-
<groupId>org.slf4j</groupId>
201-
<artifactId>*</artifactId>
202-
</exclusion>
203-
<exclusion>
204-
<groupId>ch.qos.reload4j</groupId>
205-
<artifactId>*</artifactId>
206-
</exclusion>
207-
</exclusions>
208-
</dependency>
209196
</dependencies>
210197

211198
<profiles>

0 commit comments

Comments
 (0)