diff --git a/aggregator/pom.xml b/aggregator/pom.xml
index 5e3e8be4abc..983c4ee4bac 100644
--- a/aggregator/pom.xml
+++ b/aggregator/pom.xml
@@ -45,6 +45,7 @@
         <!-- Maven to register attached artifact , which we later replace -->
         <rapids.shim.jar.phase>initialize</rapids.shim.jar.phase>
         <rapids.source.jar.phase>none</rapids.source.jar.phase>
+        <rapids.aggregator.downstream.refresh.skip>false</rapids.aggregator.downstream.refresh.skip>
     </properties>
     <dependencies>
         <dependency>
@@ -196,6 +197,7 @@
                         <goals><goal>run</goal></goals>
                         <phase>process-classes</phase>
                         <configuration>
+                            <skip>${rapids.aggregator.downstream.refresh.skip}</skip>
                             <target>
                                 <taskdef resource="net/sf/antcontrib/antcontrib.properties"/>
                                 <property name="realAggJar"
diff --git a/build/buildall b/build/buildall
index 6c977f3ba5c..33c8c445f5f 100755
--- a/build/buildall
+++ b/build/buildall
@@ -22,6 +22,25 @@ shopt -s extglob
 SKIP_CLEAN=1
 BUILD_ALL_DEBUG=0
 SCALA213=0
+UNSHIM_FAST=0
+UNSHIM_PARALLEL_WORLD_ONLY=0
+UNSHIM_REUSE_BUILT_JARS=0
+UNSHIM_ALLOWLIST_ONLY=0
+
+SCRIPT_DIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" >/dev/null 2>&1 && pwd)
+SOURCE_DIR=$(cd "$SCRIPT_DIR/.." >/dev/null 2>&1 && pwd)
+
+function first_pom_value() {
+  # Print the text of the first single-line <key>value</key> element (key=$1) in POM file $2.
+  local key="$1" pom="$2"
+  sed -n "/<$key>/{s|.*<$key>\([^<]*\)</$key>.*|\1|p;q;}" "$pom"  # q: stop at first <key> line; avoids GNU-only 0,/re/
+}
+
+function last_pom_value() {
+  # Print the text of the last single-line <element>value</element> (element=$1) in POM file $2.
+  local element="$1" pom_path="$2"
+  sed -n "s|.*<$element>\([^<]*\)</$element>.*|\1|p" "$pom_path" | tail -n 1
+}
 
 function join_by { local IFS="$1"; shift; echo "$*"; }
 
@@ -56,6 +75,14 @@ function print_usage() {
   echo "        repackage the dist module artifact using installed dependencies"
   echo "   --scala213"
   echo "        build 2.13 shims"
+  echo "   --unshim-fast"
+  echo "        skip Maven checks/docs, tests, build metadata, coverage, enforcer, and snapshot refresh for repeated unshim/dist iteration"
+  echo "   --parallel-world-only, --unshim-parallel-world-only"
+  echo "        build analyzer-only parallel-world output without the final Maven dist invocation"
+  echo "   --unshim-reuse-built-jars"
+  echo "        with --unshim-fast --parallel-world-only, skip shim Maven builds and reuse existing target jars"
+  echo "   --unshim-allowlist-only"
+  echo "        imply --unshim-fast --parallel-world-only --unshim-reuse-built-jars and require only unshim allowlist changes"
 }
 
 function bloopInstall() {
@@ -148,6 +175,25 @@ case "$1" in
   SCALA213=1
   ;;
 
+--unshim-fast|--fast-unshim)
+  UNSHIM_FAST=1
+  ;;
+
+--parallel-world-only|--unshim-parallel-world-only)
+  UNSHIM_PARALLEL_WORLD_ONLY=1
+  ;;
+
+--unshim-reuse-built-jars)
+  UNSHIM_REUSE_BUILT_JARS=1
+  ;;
+
+--unshim-allowlist-only)
+  UNSHIM_ALLOWLIST_ONLY=1
+  UNSHIM_FAST=1
+  UNSHIM_PARALLEL_WORLD_ONLY=1
+  UNSHIM_REUSE_BUILT_JARS=1
+  ;;
+
 --rebuild-dist-only)
   SKIP_DIST_DEPS="1"
   MODULE="dist"
@@ -174,14 +220,62 @@ if [[ "$DIST_PROFILE" == *Scala213 ]]; then
   SCALA213=1
 fi
 
+if [[ "$UNSHIM_PARALLEL_WORLD_ONLY" == "1" ]]; then
+  FINAL_OP="generate-resources"
+  MODULE="${MODULE:-dist}"
+fi
+
 MVN=${MVN:-"mvn"}
 # include options to mvn command
 export MVN="$MVN -Dmaven.wagon.http.retryHandler.count=3 ${MVN_OPT}"
+if [[ "$UNSHIM_FAST" == "1" ]]; then
+  export MAVEN_REFRESH_OPT="--no-snapshot-updates"
+  export MVN_FAST_SKIP_OPTS="-Dmaven.test.skip=true -Drat.skip=true -Dmaven.scalastyle.skip=true -Dmaven.scaladoc.skip=true -Dmaven.javadoc.skip=true -Ddist.jar.compress=false -Djacoco.skip=true -Denforcer.skip=true -Drapids.build.info.skip=true -Dignore.shim.revisions.check=true"
+else
+  export MAVEN_REFRESH_OPT="-U"
+  export MVN_FAST_SKIP_OPTS=""
+fi
+export UNSHIM_FAST
+export UNSHIM_PARALLEL_WORLD_ONLY
+export UNSHIM_ALLOWLIST_ONLY
+
+if [[ "$UNSHIM_REUSE_BUILT_JARS" == "1" && \
+      ( "$UNSHIM_FAST" != "1" || "$UNSHIM_PARALLEL_WORLD_ONLY" != "1" ) ]]; then
+  echo >&2 "--unshim-reuse-built-jars requires --unshim-fast --parallel-world-only"
+  exit 1
+fi
+
+if [[ "$UNSHIM_ALLOWLIST_ONLY" == "1" ]] && \
+    git -C "$SOURCE_DIR" rev-parse --is-inside-work-tree >/dev/null 2>&1; then
+  ALLOWLIST_ONLY_DIRTY=$(
+    {
+      git -C "$SOURCE_DIR" diff --name-only -- \
+        . \
+        ':(exclude)dist/unshimmed-common-from-single-shim.txt' \
+        ':(exclude)dist/unshimmed-from-each-spark3xx.txt' \
+        ':(exclude)dist/keep-in-spark-shared.txt'
+      git -C "$SOURCE_DIR" diff --cached --name-only -- \
+        . \
+        ':(exclude)dist/unshimmed-common-from-single-shim.txt' \
+        ':(exclude)dist/unshimmed-from-each-spark3xx.txt' \
+        ':(exclude)dist/keep-in-spark-shared.txt'
+    } | sort -u
+  )
+  if [[ -n "$ALLOWLIST_ONLY_DIRTY" ]]; then
+    echo >&2 "--unshim-allowlist-only can only reuse jars when tracked changes are limited to dist/unshimmed*.txt or dist/keep-in-spark-shared.txt"
+    echo >&2 "$ALLOWLIST_ONLY_DIRTY"
+    exit 1
+  fi
+fi
 
 if [[ "$SCALA213" == "1" ]]; then
   POM_FILE="scala2.13/pom.xml"
   export MVN="$MVN -f scala2.13/"
-  $(dirname $0)/make-scala-version-build-files.sh 2.13
+  if [[ "$UNSHIM_FAST" == "1" && -f "$POM_FILE" ]]; then
+    echo "Unshim fast: reusing existing Scala 2.13 POMs"
+  else
+    "$SCRIPT_DIR"/make-scala-version-build-files.sh 2.13
+  fi
 else 
   POM_FILE="pom.xml"
 fi
@@ -216,7 +310,26 @@ case $DIST_PROFILE in
 esac
 
 echo "Spark versions involved: ${SPARK_SHIM_VERSIONS[@]} ..."
-export MVN_BASE_DIR=$($MVN help:evaluate -Dexpression=project.basedir -q -DforceStdout)
+if [[ "$UNSHIM_FAST" == "1" ]]; then
+  # Fast mode skips the Maven help:evaluate launch: use the checkout path and scrape versions from the POM.
+  MVN_BASE_DIR="$SOURCE_DIR"
+  if [[ "$SCALA213" == "1" ]]; then MVN_BASE_DIR="$SOURCE_DIR/scala2.13"; fi
+  RAPIDS_PROJECT_VERSION=$(first_pom_value version "$POM_FILE")
+  RAPIDS_SCALA_BINARY_VERSION=$(last_pom_value scala.binary.version "$POM_FILE")
+  : "${RAPIDS_PROJECT_VERSION:?no <version> found in $POM_FILE}" "${RAPIDS_SCALA_BINARY_VERSION:?no <scala.binary.version> found in $POM_FILE}"
+  export MVN_BASE_DIR RAPIDS_PROJECT_VERSION RAPIDS_SCALA_BINARY_VERSION
+else
+  export MVN_BASE_DIR=$($MVN help:evaluate -Dexpression=project.basedir -q -DforceStdout)
+fi
+
+if [[ "$UNSHIM_PARALLEL_WORLD_ONLY" == "1" ]]; then
+  echo "Unshim parallel-world-only: preparing analyzer-only output and skipping JNI unpack, shimplify, and reduced POM generation"
+  MVN_FAST_SKIP_OPTS="$MVN_FAST_SKIP_OPTS -Drapids.jni.unpack.skip=true -Drapids.shimplify.skip=true -Drapids.parallel.world.skip.reduced.pom=true -Drapids.aggregator.downstream.refresh.skip=true"
+elif [[ "$UNSHIM_FAST" == "1" && -d "$MVN_BASE_DIR/dist/target/jni-deps" ]]; then
+  echo "Unshim fast: reusing existing JNI deps from $MVN_BASE_DIR/dist/target/jni-deps"
+  MVN_FAST_SKIP_OPTS="$MVN_FAST_SKIP_OPTS -Drapids.jni.unpack.skip=true"
+fi
+export MVN_FAST_SKIP_OPTS
 
 if [[ "$GEN_BLOOP" == "true" ]]; then
   bloopInstall
@@ -237,9 +350,45 @@ fi
 
 echo "Building a combined dist jar with Shims for ${SPARK_SHIM_VERSIONS[@]} ..."
 
+function refresh_fast_aggregator_jar() {
+  # In unshim-fast mode, copy the shaded aggregator jar for shim $1 over its spark<ver> classifier jar.
+  [[ "$UNSHIM_FAST" == "1" ]] || return 0
+  local BUILD_VER=$1
+  local agg_dir="$MVN_BASE_DIR/aggregator/target/spark$BUILD_VER"
+  local agg_base="rapids-4-spark-aggregator_${RAPIDS_SCALA_BINARY_VERSION}-${RAPIDS_PROJECT_VERSION}"
+  local shaded_jar="$agg_dir/${agg_base}-shaded.jar"
+  local downstream_jar="$agg_dir/${agg_base}-spark$BUILD_VER.jar"
+  if [[ ! -f "$shaded_jar" ]]; then
+    echo >&2 "Expected shaded aggregator jar missing: $shaded_jar"
+    exit 255
+  fi
+  # Byte-identical copy already in place: leave the downstream jar untouched.
+  if [[ -f "$downstream_jar" ]] && cmp -s "$shaded_jar" "$downstream_jar"; then return 0; fi
+  cp -p "$shaded_jar" "$downstream_jar" || { echo >&2 "Failed to refresh aggregator jar: $downstream_jar"; exit 255; }
+}
+export -f refresh_fast_aggregator_jar
+
+function verify_reusable_unshim_artifacts() {
+  # Exit 255 unless both the sql-plugin-api jar and the shaded aggregator jar exist for shim $1.
+  local BUILD_VER=$1 candidate
+  local shim="spark$BUILD_VER"
+  local suffix="_${RAPIDS_SCALA_BINARY_VERSION}-${RAPIDS_PROJECT_VERSION}"
+  local required_jars=(
+    "$MVN_BASE_DIR/sql-plugin-api/target/$shim/rapids-4-spark-sql-plugin-api${suffix}-$shim.jar"
+    "$MVN_BASE_DIR/aggregator/target/$shim/rapids-4-spark-aggregator${suffix}-shaded.jar"
+  )
+  for candidate in "${required_jars[@]}"; do
+    [[ -f "$candidate" ]] && continue
+    echo >&2 "Expected reusable unshim artifact missing: $candidate"
+    echo >&2 "Re-run without --unshim-reuse-built-jars after source or dependency changes."
+    exit 255
+  done
+}
+export -f verify_reusable_unshim_artifacts
+
 function build_single_shim() {
   [[ "$BUILD_ALL_DEBUG" == "1" ]] && set -x
-  BUILD_VER=$1
+  local BUILD_VER=$1
   mkdir -p "$MVN_BASE_DIR/target"
   if (( BUILD_PARALLEL == 1 || NUM_SHIMS == 1 )); then
     # Single-shim/serial build: stream Maven output live rather than to a log
@@ -255,8 +404,8 @@ function build_single_shim() {
     LOG_FILE="$MVN_BASE_DIR/target/mvn-build-$BUILD_VER.log"
   fi
 
-  if [[ "$BUILD_VER" == "$BASE_VER" ]]; then
-    SKIP_CHECKS="false"
+  if [[ "$BUILD_VER" == "$BASE_VER" && \
+        ( "$UNSHIM_FAST" != "1" || "$UNSHIM_PARALLEL_WORLD_ONLY" != "1" ) ]]; then
     # WORKAROUND:
     # maven build on L193 currently relies on aggregator dependency which
     # will removed by
@@ -267,10 +416,20 @@ function build_single_shim() {
     #
     MVN_PHASE="install"
   else
-    SKIP_CHECKS="true"
     MVN_PHASE="package"
   fi
 
+  if [[ "$UNSHIM_FAST" == "1" || "$BUILD_VER" != "$BASE_VER" ]]; then
+    SKIP_CHECKS="true"
+  else
+    SKIP_CHECKS="false"
+  fi
+
+  local BUILD_PROJECTS="tools"
+  if [[ "$UNSHIM_FAST" == "1" ]]; then
+    BUILD_PROJECTS="aggregator"
+  fi
+
   echo "#### REDIRECTING mvn output to ${LOG_FILE:-stdout} ####"
   (
     if [[ "$LOG_FILE" == "" ]]; then
@@ -278,13 +437,15 @@ function build_single_shim() {
     else
       exec > "$LOG_FILE" 2>&1 || exit $?
     fi
-    $MVN -U "$MVN_PHASE" \
+    $MVN $MAVEN_REFRESH_OPT "$MVN_PHASE" \
         -DskipTests \
         -Dbuildver="$BUILD_VER" \
         -Drat.skip="$SKIP_CHECKS" \
-        -Dmaven.scaladoc.skip \
+        -Dmaven.scaladoc.skip=true \
+        -Dmaven.javadoc.skip=true \
         -Dmaven.scalastyle.skip="$SKIP_CHECKS" \
-        -pl tools -am
+        $MVN_FAST_SKIP_OPTS \
+        -pl "$BUILD_PROJECTS" -am
   ) || {
         # Only tail when output went to a real log file; for a live stream
         # (/dev/tty or existing stdout) the failure output is already on screen.
@@ -294,6 +455,7 @@ function build_single_shim() {
         esac
         exit 255
       }
+  refresh_fast_aggregator_jar "$BUILD_VER"
 }
 export -f build_single_shim
 
@@ -310,25 +472,62 @@ export -f build_single_shim
 time (
   # printf a single buildver array element per line
   if [[ "$SKIP_DIST_DEPS" != "1" ]]; then
+    if [[ "$UNSHIM_REUSE_BUILT_JARS" == "1" ]]; then
+      echo "Unshim fast: reusing existing per-shim jars and skipping Maven shim builds"
+      for bv in "${SPARK_SHIM_VERSIONS[@]}"; do
+        verify_reusable_unshim_artifacts "$bv"
+        refresh_fast_aggregator_jar "$bv"
+      done
+    else
     # Execute initialize to download a massive jar for spark-rapids-jni in a single thread to
-    # avoid repeating this work in parallel
-    # Initialize sql-plugin-api only to avoid dealing with missing submodule dependencies
-    #
-    $MVN initialize -pl sql-plugin-api -am
+    # avoid repeating this work in parallel. This is unnecessary in unshim-fast modes that skip
+    # JNI unpacking.
+    if [[ "$UNSHIM_FAST" == "1" && "$MVN_FAST_SKIP_OPTS" == *"-Drapids.jni.unpack.skip=true"* ]]; then
+      echo "Unshim fast: skipping serial Maven initialize preflight"
+    else
+      # Initialize sql-plugin-api only to avoid dealing with missing submodule dependencies.
+      $MVN initialize -pl sql-plugin-api -am
+    fi
 
     printf "%s\n" "${SPARK_SHIM_VERSIONS[@]}" | \
       xargs -t -I% -P "$BUILD_PARALLEL" -n 1 \
       bash -c 'build_single_shim "$@"' _ %
+    fi
   fi
-  # This used to resume from dist. However, without including aggregator in the build
-  # the build does not properly initialize spark.version property via buildver profiles
-  # in the root pom, and we get a missing spark330 dependency even for --profile=330,331
-  # where the build does not require it. Moving it to aggregator resolves this issue with
-  # a negligible increase of the build time by ~2 seconds.
+  if [[ "$UNSHIM_FAST" == "1" && "$UNSHIM_REUSE_BUILT_JARS" != "1" ]]; then
+    for bv in "${SPARK_SHIM_VERSIONS[@]}"; do
+      refresh_fast_aggregator_jar "$bv"
+    done
+  fi
+  # Non-fast builds resume from aggregator so Maven initializes the buildver-derived
+  # spark.version.classifier before dist resolves its aggregator dependency. The unshim-fast
+  # dist path can skip that extra aggregator pass because the per-shim builds above already
+  # installed the base aggregator jar and refreshed all target aggregator jars.
   joinShimBuildFrom="aggregator"
   INCLUDED_BUILDVERS_OPT=-Dincluded_buildvers=$(join_by , "${SPARK_SHIM_VERSIONS[@]}")
-  echo "Resuming from $joinShimBuildFrom build only using $BASE_VER"
-  $MVN $FINAL_OP -rf $joinShimBuildFrom $MODULE_OPT $MVN_PROFILE_OPT $INCLUDED_BUILDVERS_OPT \
+  if [[ "$UNSHIM_FAST" == "1" && "$MODULE" == "dist" ]]; then
+    if [[ "$UNSHIM_PARALLEL_WORLD_ONLY" == "1" ]]; then
+      echo "Unshim fast: assembling parallel-world directly without final Maven dist invocation"
+      python3 "$SOURCE_DIR/dist/scripts/build-unshim-parallel-world.py" \
+        --mvn-base-dir "$MVN_BASE_DIR" \
+        --source-dir "$SOURCE_DIR" \
+        --project-version "$RAPIDS_PROJECT_VERSION" \
+        --scala-binary-version "$RAPIDS_SCALA_BINARY_VERSION" \
+        --buildvers "$(join_by , "${SPARK_SHIM_VERSIONS[@]}")" \
+        --ignore-shim-revisions-check
+      exit $?  # skip the final Maven step but propagate the assembler's status instead of forcing success
+    else
+      echo "Resuming at dist only using $BASE_VER"
+      FINAL_RESUME_OPT=""
+      FINAL_MODULE_OPT="--projects dist"
+    fi
+  else
+    echo "Resuming from $joinShimBuildFrom build only using $BASE_VER"
+    FINAL_RESUME_OPT="-rf $joinShimBuildFrom"
+    FINAL_MODULE_OPT="$MODULE_OPT"
+  fi
+  $MVN $FINAL_OP $FINAL_RESUME_OPT $FINAL_MODULE_OPT $MVN_PROFILE_OPT $INCLUDED_BUILDVERS_OPT \
     -Dbuildver="$BASE_VER" \
-    -DskipTests -Dmaven.scaladoc.skip
+    -DskipTests -Dmaven.scaladoc.skip=true -Dmaven.javadoc.skip=true \
+    $MVN_FAST_SKIP_OPTS
 )
diff --git a/delta-lake/common/src/main/databricks/scala/com/databricks/sql/transaction/tahoe/rapids/GpuCheckDeltaInvariant.scala b/delta-lake/common/src/main/databricks/scala/com/databricks/sql/transaction/tahoe/rapids/GpuCheckDeltaInvariant.scala
index f7d5a9f402b..045ca4d238b 100644
--- a/delta-lake/common/src/main/databricks/scala/com/databricks/sql/transaction/tahoe/rapids/GpuCheckDeltaInvariant.scala
+++ b/delta-lake/common/src/main/databricks/scala/com/databricks/sql/transaction/tahoe/rapids/GpuCheckDeltaInvariant.scala
@@ -136,7 +136,7 @@ object GpuCheckDeltaInvariant extends Logging {
     ExprChecks.projectOnly(
       TypeSig.all,
       TypeSig.all,
-      paramCheck = Seq(ParamCheck("input", TypeSig.all, TypeSig.all))),
+      paramCheck = Seq(new ParamCheck("input", TypeSig.all, TypeSig.all))),
     (c, conf, p, r) => new GpuCheckDeltaInvariantMeta(c, conf, p, r))
 
   def maybeConvertToGpu(
diff --git a/delta-lake/common/src/main/databricks/scala/com/nvidia/spark/rapids/delta/DatabricksDeltaProviderBase.scala b/delta-lake/common/src/main/databricks/scala/com/nvidia/spark/rapids/delta/DatabricksDeltaProviderBase.scala
index 0520a924367..156cd168768 100644
--- a/delta-lake/common/src/main/databricks/scala/com/nvidia/spark/rapids/delta/DatabricksDeltaProviderBase.scala
+++ b/delta-lake/common/src/main/databricks/scala/com/nvidia/spark/rapids/delta/DatabricksDeltaProviderBase.scala
@@ -174,10 +174,10 @@ trait DatabricksDeltaProviderBase extends DeltaProviderImplBase {
       "Delta RTAS was tagged as unsupported and should not be converted to GPU")
   }
 
-  protected case class DeltaWriteV1Config(
-      deltaLog: DeltaLog,
-      forceOverwrite: Boolean,
-      options: mutable.HashMap[String, String])
+  protected class DeltaWriteV1Config(
+      val deltaLog: DeltaLog,
+      val forceOverwrite: Boolean,
+      val options: mutable.HashMap[String, String])
 
   private def extractWriteV1Config(
       meta: RapidsMeta[_, _, _],
@@ -210,7 +210,7 @@ trait DatabricksDeltaProviderBase extends DeltaProviderImplBase {
           f.get(outerObj).asInstanceOf[mutable.HashMap[String, String]]
         }
         if (forceOverwrite.isDefined && options.isDefined) {
-          Some(DeltaWriteV1Config(deltaLog, forceOverwrite.get, options.get))
+          Some(new DeltaWriteV1Config(deltaLog, forceOverwrite.get, options.get))
         } else {
           meta.willNotWorkOnGpu(s"write class has unsupported outer class $outerClass")
           None
diff --git a/delta-lake/common/src/main/delta-33x-41x/scala/com/nvidia/spark/rapids/delta/common/DeltaProviderBase.scala b/delta-lake/common/src/main/delta-33x-41x/scala/com/nvidia/spark/rapids/delta/common/DeltaProviderBase.scala
index 84ab70e804a..0cee43f69d0 100644
--- a/delta-lake/common/src/main/delta-33x-41x/scala/com/nvidia/spark/rapids/delta/common/DeltaProviderBase.scala
+++ b/delta-lake/common/src/main/delta-33x-41x/scala/com/nvidia/spark/rapids/delta/common/DeltaProviderBase.scala
@@ -41,11 +41,12 @@ import org.apache.spark.sql.types._
 import org.apache.spark.sql.vectorized.ColumnarBatch
 
 // Expression support shared across versions - defined outside class to avoid serialization issues
-case class GpuIncrementMetricMeta(
-  cpuInc: IncrementMetric,
-  override val conf: RapidsConf,
-  p: Option[RapidsMeta[_, _, _]],
-  r: DataFromReplacementRule) extends ExprMeta[IncrementMetric](cpuInc, conf, p, r) {
+class GpuIncrementMetricMeta(
+    val cpuInc: IncrementMetric,
+    override val conf: RapidsConf,
+    val p: Option[RapidsMeta[_, _, _]],
+    val r: DataFromReplacementRule)
+    extends ExprMeta[IncrementMetric](cpuInc, conf, p, r) with Serializable {
   override def convertToGpuImpl(): GpuExpression = {
     val gpuChild = childExprs.head.convertToGpu()
     GpuIncrementMetric(cpuInc, gpuChild)
@@ -88,7 +89,7 @@ abstract class DeltaProviderBase extends DeltaIOProvider {
     GpuOverrides.expr[IncrementMetric](
       "IncrementMetric",
       ExprChecks.unaryProject(TypeSig.all, TypeSig.all, TypeSig.all, TypeSig.all),
-      (cpuInc, conf, p, r) => GpuIncrementMetricMeta(cpuInc, conf, p, r)
+      (cpuInc, conf, p, r) => new GpuIncrementMetricMeta(cpuInc, conf, p, r)
     )
   ).map(r => (r.getClassFor.asSubclass(classOf[Expression]), r)).toMap
 
diff --git a/delta-lake/common/src/main/delta-33x-41x/scala/com/nvidia/spark/rapids/delta/common/GpuDeltaParquetFileFormatBase.scala b/delta-lake/common/src/main/delta-33x-41x/scala/com/nvidia/spark/rapids/delta/common/GpuDeltaParquetFileFormatBase.scala
index 61c586b955e..fa3997dbdbc 100644
--- a/delta-lake/common/src/main/delta-33x-41x/scala/com/nvidia/spark/rapids/delta/common/GpuDeltaParquetFileFormatBase.scala
+++ b/delta-lake/common/src/main/delta-33x-41x/scala/com/nvidia/spark/rapids/delta/common/GpuDeltaParquetFileFormatBase.scala
@@ -26,7 +26,6 @@ import org.apache.hadoop.fs.Path
 import scala.collection.mutable.ArrayBuffer
 
 import org.apache.spark.broadcast.Broadcast
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.SparkSession
 import org.apache.spark.sql.catalyst.InternalRow
 import org.apache.spark.sql.connector.read.{InputPartition, PartitionReader, PartitionReaderFactory}
@@ -52,7 +51,7 @@ class GpuDeltaParquetFileFormatBase(
     optimizationsEnabled: Boolean = true,
     tablePath: Option[String] = None,
     isCDCRead: Boolean = false
-  ) extends com.nvidia.spark.rapids.delta.GpuDeltaParquetFileFormat with Logging {
+  ) extends com.nvidia.spark.rapids.delta.GpuDeltaParquetFileFormat {
 
   // Validate either we have all arguments for DV enabled read or none of them.
 
diff --git a/delta-lake/common/src/main/delta-33x-41x/scala/com/nvidia/spark/rapids/delta/common/GpuDeltaParquetFileFormatBase2.scala b/delta-lake/common/src/main/delta-33x-41x/scala/com/nvidia/spark/rapids/delta/common/GpuDeltaParquetFileFormatBase2.scala
index 48587ce3bca..b1a06781ec1 100644
--- a/delta-lake/common/src/main/delta-33x-41x/scala/com/nvidia/spark/rapids/delta/common/GpuDeltaParquetFileFormatBase2.scala
+++ b/delta-lake/common/src/main/delta-33x-41x/scala/com/nvidia/spark/rapids/delta/common/GpuDeltaParquetFileFormatBase2.scala
@@ -36,7 +36,6 @@ import org.apache.parquet.schema.MessageType
 
 import org.apache.spark.TaskContext
 import org.apache.spark.broadcast.Broadcast
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.SparkSession
 import org.apache.spark.sql.catalyst.InternalRow
 import org.apache.spark.sql.catalyst.util.QuotingUtils
@@ -71,7 +70,7 @@ class GpuDeltaParquetFileFormatBase2(
     optimizationsEnabled: Boolean = true,
     tablePath: Option[String] = None,
     isCDCRead: Boolean = false
-) extends com.nvidia.spark.rapids.delta.GpuDeltaParquetFileFormat with Logging {
+) extends com.nvidia.spark.rapids.delta.GpuDeltaParquetFileFormat {
 
   // Validate either we have all arguments for DV enabled read or none of them.
 
@@ -443,11 +442,11 @@ class GpuDeltaParquetFileFormatBase2(
    * @param rowGroupNumRows number of rows in each row group
    * @param partitionIndex index into rowsPerPartition / allPartValues this file contributes to
    */
-  case class PerFileDVEntry(
-      dvDescriptor: Option[String],
-      rowGroupOffsets: Array[Long],
-      rowGroupNumRows: Array[Int],
-      partitionIndex: Int)
+  class PerFileDVEntry(
+      val dvDescriptor: Option[String],
+      val rowGroupOffsets: Array[Long],
+      val rowGroupNumRows: Array[Int],
+      val partitionIndex: Int)
 
   /**
    * Per-file DV load result produced during [[prepareForDecode]].
@@ -455,7 +454,7 @@ class GpuDeltaParquetFileFormatBase2(
    * @param gpuBitmap serialized roaring bitmap buffer for the file's deletion vector
    * @param aliveCount number of alive (non-deleted) rows in the file
    */
-  case class SerializedRoaringBitmap(gpuBitmap: SpillableHostBuffer, aliveCount: Long)
+  class SerializedRoaringBitmap(val gpuBitmap: SpillableHostBuffer, val aliveCount: Long)
 
   /**
    * Per-batch DV info that replaces [[ParquetExtraInfo]] in [[CurrentChunkMeta]] after batch
@@ -464,13 +463,13 @@ class GpuDeltaParquetFileFormatBase2(
    *  - [[loadedDVResults]] is filled in by [[prepareForDecode]] after the copy phase.
    *  [[perFileEntries]] and [[loadedDVResults]] are always parallel sequences of the same length.
    */
-  case class DeltaBatchExtraInfo(
+  class DeltaBatchExtraInfo(
       override val dateRebaseMode: DateTimeRebaseMode,
       override val timestampRebaseMode: DateTimeRebaseMode,
       override val hasInt96Timestamps: Boolean,
       val perFileEntries: Seq[PerFileDVEntry],
       // Filled by prepareForDecode() after the copy phase; empty until then.
-      val loadedDVResults: Seq[SerializedRoaringBitmap] = Seq.empty
+      val loadedDVResults: Seq[SerializedRoaringBitmap]
   ) extends ParquetExtraInfo(dateRebaseMode, timestampRebaseMode, hasInt96Timestamps) {
     /**
      * True if at least one file in this batch carries a deletion vector descriptor.
@@ -481,7 +480,8 @@ class GpuDeltaParquetFileFormatBase2(
      * Returns a copy of this instance with [[loadedDVResults]] set.
      */
     def withLoadedDVResults(loadedDVResults: Seq[SerializedRoaringBitmap]): DeltaBatchExtraInfo =
-      this.copy(loadedDVResults = loadedDVResults)
+      new DeltaBatchExtraInfo(dateRebaseMode, timestampRebaseMode, hasInt96Timestamps,
+        perFileEntries, loadedDVResults)
 
     /**
      * Closes the DV bitmaps in [[loadedDVResults]].
@@ -502,7 +502,7 @@ class GpuDeltaParquetFileFormatBase2(
       queryUsesInputFile: Boolean)
     extends AbstractGpuParquetMultiFilePartitionReaderFactory(sqlConf, broadcastedConf,
       dataSchema, readDataSchema, partitionSchema, filters, rapidsConf, poolConfBuilder,
-      metrics, queryUsesInputFile) with Logging {
+      metrics, queryUsesInputFile) {
 
     logDebug("Using GpuDeltaParquetMultiFilePartitionReaderFactory for multi-threaded Parquet " +
       "reading with deletion vectors")
@@ -584,11 +584,11 @@ class GpuDeltaParquetFileFormatBase2(
             val (rowGroupOffsets, rowGroupNumRows) =
               RapidsDeletionVectors.getRowGroupMetadata(singleFileInfo.blocks)
             clippedBlocks ++= singleFileInfo.blocks.zipWithIndex.map { case (block, i) =>
-              ParquetSingleDataBlockMeta(
+              new ParquetSingleDataBlockMeta(
                 singleFileInfo.filePath,
-                ParquetDataBlock(block, compressCfg),
+                new ParquetDataBlock(block, compressCfg),
                 metaAndFile.file.partitionValues,
-                ParquetSchemaWrapper(singleFileInfo.schema),
+                new ParquetSchemaWrapper(singleFileInfo.schema),
                 singleFileInfo.readSchema,
                 new DeltaParquetExtraInfo(
                   singleFileInfo.dateRebaseMode,
@@ -745,55 +745,53 @@ class GpuDeltaParquetFileFormatBase2(
     /**
      * Deletion vector metadata for a single host memory buffer containing a part of data.
      */
-    private case class SingleBufferDVMetadata(
-        maybeDvInfo: Option[SpillableDeletionVectorInfo]
-    )
-
-    private case class DeletionVectorMetadata(
-        metadatas: Array[SingleBufferDVMetadata]
-    )
-
-    private object DeletionVectorMetadata {
-      def forSingleBuffer(maybeDvInfo: Option[SpillableDeletionVectorInfo]) = {
-        DeletionVectorMetadata(
-          Array(
-            SingleBufferDVMetadata(maybeDvInfo)
-          )
+    private class SingleBufferDVMetadata(
+        val maybeDvInfo: Option[SpillableDeletionVectorInfo])
+
+    private class DeletionVectorMetadata(
+        val metadatas: Array[SingleBufferDVMetadata])
+
+    private def deletionVectorMetadataForSingleBuffer(
+        maybeDvInfo: Option[SpillableDeletionVectorInfo]): DeletionVectorMetadata = {
+      new DeletionVectorMetadata(
+        Array(
+          new SingleBufferDVMetadata(maybeDvInfo)
         )
-      }
+      )
+    }
 
-      def combine(metadatas: Array[DeletionVectorMetadata]): DeletionVectorMetadata = {
-        DeletionVectorMetadata(metadatas.flatMap(_.metadatas))
-      }
+    private def combineDeletionVectorMetadata(
+        metadatas: Array[DeletionVectorMetadata]): DeletionVectorMetadata = {
+      new DeletionVectorMetadata(metadatas.flatMap(_.metadatas))
     }
 
-    private case class DeltaParquetHostMemoryEmptyMetaData(
+    private class DeltaParquetHostMemoryEmptyMetaData(
         override val partitionedFile: PartitionedFile,
-        bufferSize: Long,
+        val bufferSize: Long,
         override val bytesRead: Long,
-        dateRebaseMode: DateTimeRebaseMode,
-        timestampRebaseMode: DateTimeRebaseMode,
-        hasInt96Timestamps: Boolean,
-        clippedSchema: MessageType,
-        readSchema: StructType,
-        numRows: Long,
-        dvMetadata: Array[DeletionVectorMetadata],
-        override val allPartValues: Option[Array[(Long, InternalRow)]] = None)
+        val dateRebaseMode: DateTimeRebaseMode,
+        val timestampRebaseMode: DateTimeRebaseMode,
+        val hasInt96Timestamps: Boolean,
+        val clippedSchema: MessageType,
+        val readSchema: StructType,
+        val numRows: Long,
+        val dvMetadata: Array[DeletionVectorMetadata],
+        override val allPartValues: Option[Array[(Long, InternalRow)]])
       extends HostMemoryEmptyMetaData {}
 
-    private case class DeltaParquetHostMemoryBuffersWithMetaData(
+    private class DeltaParquetHostMemoryBuffersWithMetaData(
         override val partitionedFile: PartitionedFile,
         override val memBuffersAndSizes: Array[SingleHMBAndMeta],
         override val bytesRead: Long,
-        dateRebaseMode: DateTimeRebaseMode,
-        timestampRebaseMode: DateTimeRebaseMode,
-        hasInt96Timestamps: Boolean,
-        clippedSchema: MessageType,
-        readSchema: StructType,
+        val dateRebaseMode: DateTimeRebaseMode,
+        val timestampRebaseMode: DateTimeRebaseMode,
+        val hasInt96Timestamps: Boolean,
+        val clippedSchema: MessageType,
+        val readSchema: StructType,
         override val allPartValues: Option[Array[(Long, InternalRow)]],
         // deletion vector metadata. should be aligned with memBuffersAndSizes if deletion vectors
         // are present.
-        dvMetadata: Array[DeletionVectorMetadata]
+        val dvMetadata: Array[DeletionVectorMetadata]
     ) extends HostMemoryBuffersWithMetaData {
 
       override def consumeHeadBuffer(): HostMemoryBuffersWithMetaData = {
@@ -806,7 +804,17 @@ class GpuDeltaParquetFileFormatBase2(
         } else {
           (Array.empty[SingleHMBAndMeta], Array.empty[DeletionVectorMetadata])
         }
-        this.copy(memBuffersAndSizes = remainingBuffers, dvMetadata = newDvMetadata)
+        new DeltaParquetHostMemoryBuffersWithMetaData(
+          partitionedFile,
+          remainingBuffers,
+          bytesRead,
+          dateRebaseMode,
+          timestampRebaseMode,
+          hasInt96Timestamps,
+          clippedSchema,
+          readSchema,
+          allPartValues,
+          newDvMetadata)
       }
     }
 
@@ -843,7 +851,7 @@ class GpuDeltaParquetFileFormatBase2(
       }
 
       closeOnExcept(maybeSerializedDV) { _ =>
-        val dvMetadata = DeletionVectorMetadata.forSingleBuffer(
+        val dvMetadata = deletionVectorMetadataForSingleBuffer(
           maybeSerializedDV.map{ serializedDV =>
             val (rowGroupOffsets, rowGroupNumRows) = RapidsDeletionVectors
               .getRowGroupMetadata(blocks)
@@ -853,7 +861,7 @@ class GpuDeltaParquetFileFormatBase2(
               rowGroupOffsets,
               rowGroupNumRows)}
         )
-        DeltaParquetHostMemoryEmptyMetaData(
+        new DeltaParquetHostMemoryEmptyMetaData(
           partitionedFile,
           bufferSize,
           bytesRead,
@@ -863,7 +871,8 @@ class GpuDeltaParquetFileFormatBase2(
           clippedSchema,
           readSchema,
           numRows,
-          Array(dvMetadata)
+          Array(dvMetadata),
+          None
         )
       }
     }
@@ -872,9 +881,9 @@ class GpuDeltaParquetFileFormatBase2(
         nonEmptyMeta: CombinedMeta): HostMemoryEmptyMetaData = {
       val metaForEmpty = emptyMeta.metaForEmpty
       val toCombine = emptyMeta.emptyMetas.map(_.asInstanceOf[DeltaParquetHostMemoryEmptyMetaData])
-      val combinedDVMeta = DeletionVectorMetadata.combine(toCombine.flatMap(_.dvMetadata))
+      val combinedDVMeta = combineDeletionVectorMetadata(toCombine.flatMap(_.dvMetadata))
 
-      DeltaParquetHostMemoryEmptyMetaData(
+      new DeltaParquetHostMemoryEmptyMetaData(
         metaForEmpty.partitionedFile, // just pick one since not used
         emptyMeta.emptyBufferSize,
         emptyMeta.emptyTotalBytesRead,
@@ -912,7 +921,7 @@ class GpuDeltaParquetFileFormatBase2(
             .map(_.asInstanceOf[ParquetDataBlock].dataBlock)
           val (rowGroupOffsets, rowGroupNumRows) = RapidsDeletionVectors
             .getRowGroupMetadata(dataBlocks)
-          DeletionVectorMetadata.forSingleBuffer(
+          deletionVectorMetadataForSingleBuffer(
             maybeSerializedDV.map { serializedDV =>
               serializedDV.incRefCount()
               SpillableDeletionVectorInfo(
@@ -923,7 +932,7 @@ class GpuDeltaParquetFileFormatBase2(
             })
         }
 
-        DeltaParquetHostMemoryBuffersWithMetaData(
+        new DeltaParquetHostMemoryBuffersWithMetaData(
           partitionedFile,
           memBuffersAndSize,
           bytesRead,
@@ -946,9 +955,9 @@ class GpuDeltaParquetFileFormatBase2(
       val metaToUse = combinedMeta.firstNonEmpty
       val toCombine = combinedMeta.toCombine
         .collect { case hmb: DeltaParquetHostMemoryBuffersWithMetaData => hmb }
-      val combinedDVMeta = DeletionVectorMetadata.combine(toCombine.flatMap(_.dvMetadata))
+      val combinedDVMeta = combineDeletionVectorMetadata(toCombine.flatMap(_.dvMetadata))
 
-      DeltaParquetHostMemoryBuffersWithMetaData(
+      new DeltaParquetHostMemoryBuffersWithMetaData(
         metaToUse.partitionedFile,
         Array(newHmbBufferInfo),
         offset,
@@ -1113,12 +1122,12 @@ class GpuDeltaParquetFileFormatBase2(
             fileNumRows += extra.rowGroupNumRows
           }
 
-          PerFileDVEntry(fileDesc, fileOffsets.toArray, fileNumRows.toArray, partitionIndex)
+          new PerFileDVEntry(fileDesc, fileOffsets.toArray, fileNumRows.toArray, partitionIndex)
       }.toSeq
 
       val batchExtra = new DeltaBatchExtraInfo(
         meta.extraInfo.dateRebaseMode, meta.extraInfo.timestampRebaseMode,
-        meta.extraInfo.hasInt96Timestamps, fileEntries)
+        meta.extraInfo.hasInt96Timestamps, fileEntries, Seq.empty)
       meta.copy(extraInfo = batchExtra)
     }
 
@@ -1160,7 +1169,7 @@ class GpuDeltaParquetFileFormatBase2(
               require(numDeleted <= totalRows,
                 s"Deletion vector cardinality ($numDeleted) exceeds " +
                   s"file row count ($totalRows)")
-              SerializedRoaringBitmap(gpuBitmap, totalRows - numDeleted)
+              new SerializedRoaringBitmap(gpuBitmap, totalRows - numDeleted)
             }
           }
         })
@@ -1238,8 +1247,8 @@ class GpuDeltaParquetFileFormatBase2(
  * A simple wrapper to adapt the DeletionVector.ParquetChunkedReader to the ChunkedReader interface
  * expected by AbstractParquetTableReader.
  */
-case class DeltaParquetChunkedReader(delegate: DeletionVector.ParquetChunkedReader)
-  extends ChunkedReader {
+class DeltaParquetChunkedReader(val delegate: DeletionVector.ParquetChunkedReader)
+  extends ChunkedReader with Serializable {
   override def hasNext: Boolean = delegate.hasNext
   override def next: Table = delegate.readChunk()
   override def close(): Unit = delegate.close()
@@ -1248,7 +1257,7 @@ case class DeltaParquetChunkedReader(delegate: DeletionVector.ParquetChunkedRead
 /**
  * A chunked reader for Parquet files with deletion vectors.
  */
-case class DeltaParquetTableReader(
+class DeltaParquetTableReader(
     conf: Configuration,
     chunkSizeByteLimit: Long,
     maxChunkedReaderMemoryUsageSizeBytes: Long,
@@ -1268,11 +1277,11 @@ case class DeltaParquetTableReader(
   conf, chunkSizeByteLimit, maxChunkedReaderMemoryUsageSizeBytes, opts, buffers, metrics,
   dateRebaseMode, timestampRebaseMode, isSchemaCaseSensitive, useFieldId, readDataSchema,
   clippedParquetSchema, splits, debugDumpPrefix, debugDumpAlways
-) {
+) with Serializable {
 
   logDebug("Using DeltaParquetTableReader for reading Parquet with deletion vectors")
 
-  override protected val reader = DeltaParquetChunkedReader(
+  override protected val reader = new DeltaParquetChunkedReader(
     DeletionVector.newParquetChunkedReader(chunkSizeByteLimit,
       maxChunkedReaderMemoryUsageSizeBytes, opts, buffers, dvInfos)
   )
@@ -1287,7 +1296,7 @@ case class DeltaParquetTableReader(
   }
 }
 
-object MakeParquetTableWithDVProducer extends Logging {
+object MakeParquetTableWithDVProducer extends RapidsLocalLog {
   def apply(
       useChunkedReader: Boolean,
       maxChunkedReaderMemoryUsageSizeBytes: Long,
@@ -1318,7 +1327,7 @@ object MakeParquetTableWithDVProducer extends Logging {
       }
     }
     if (useChunkedReader) {
-      DeltaParquetTableReader(conf, chunkSizeByteLimit, maxChunkedReaderMemoryUsageSizeBytes,
+      new DeltaParquetTableReader(conf, chunkSizeByteLimit, maxChunkedReaderMemoryUsageSizeBytes,
         opts, buffers, metrics, dateRebaseMode, timestampRebaseMode,
         isSchemaCaseSensitive, useFieldId, readDataSchema, clippedParquetSchema,
         splits, debugDumpPrefix, debugDumpAlways, deletionVectorInfos)
diff --git a/delta-lake/common/src/main/delta-33x-41x/scala/org/apache/spark/sql/delta/rapids/DeltaRuntimeShimBase.scala b/delta-lake/common/src/main/delta-33x-41x/scala/org/apache/spark/sql/delta/rapids/DeltaRuntimeShimBase.scala
index b72f13da81a..f59d892f73e 100644
--- a/delta-lake/common/src/main/delta-33x-41x/scala/org/apache/spark/sql/delta/rapids/DeltaRuntimeShimBase.scala
+++ b/delta-lake/common/src/main/delta-33x-41x/scala/org/apache/spark/sql/delta/rapids/DeltaRuntimeShimBase.scala
@@ -58,7 +58,7 @@ abstract class DeltaRuntimeShimBase extends DeltaRuntimeShim {
 
   override def startTransaction(log: DeltaLog, conf: RapidsConf, clock: Clock):
       GpuOptimisticTransactionBase = {
-    startTransaction(StartTransactionArg(log, conf, clock))
+    startTransaction(new StartTransactionArg(log, conf, clock))
   }
 
   override def startTransaction(arg: StartTransactionArg): GpuOptimisticTransactionBase = {
diff --git a/delta-lake/common/src/main/delta-33x/scala/com/nvidia/spark/rapids/delta/shims/StatsExprShim.scala b/delta-lake/common/src/main/delta-33x/scala/com/nvidia/spark/rapids/delta/shims/StatsExprShim.scala
index a388c5256f4..99c4f148f5d 100644
--- a/delta-lake/common/src/main/delta-33x/scala/com/nvidia/spark/rapids/delta/shims/StatsExprShim.scala
+++ b/delta-lake/common/src/main/delta-33x/scala/com/nvidia/spark/rapids/delta/shims/StatsExprShim.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2025, NVIDIA CORPORATION.
+ * Copyright (c) 2025-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -24,3 +24,4 @@ import org.apache.spark.sql.catalyst.expressions.Expression
 object StatsExprShim {
   def unwrapRuntimeReplaceable(expr: Expression): Expression = expr
 }
+// Keep executable line numbers aligned with older Delta shims for binary-dedupe.
diff --git a/delta-lake/common/src/main/delta-33x/scala/org/apache/spark/sql/delta/rapids/ShimDeltaInvariantCheckerExec.scala b/delta-lake/common/src/main/delta-33x/scala/org/apache/spark/sql/delta/rapids/ShimDeltaInvariantCheckerExec.scala
index a488356e6f2..52019f7db2a 100644
--- a/delta-lake/common/src/main/delta-33x/scala/org/apache/spark/sql/delta/rapids/ShimDeltaInvariantCheckerExec.scala
+++ b/delta-lake/common/src/main/delta-33x/scala/org/apache/spark/sql/delta/rapids/ShimDeltaInvariantCheckerExec.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2025, NVIDIA CORPORATION.
+ * Copyright (c) 2025-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -32,3 +32,4 @@ object ShimDeltaInvariantCheckerExec {
     DeltaInvariantCheckerExec(plan, constraints)
   }
 }
+// Keep executable line numbers aligned with older Delta shims for binary-dedupe.
diff --git a/delta-lake/common/src/main/delta-io/scala/com/nvidia/spark/rapids/delta/DeltaIOProvider.scala b/delta-lake/common/src/main/delta-io/scala/com/nvidia/spark/rapids/delta/DeltaIOProvider.scala
index 8fd372c0a1b..f04dc75ff69 100644
--- a/delta-lake/common/src/main/delta-io/scala/com/nvidia/spark/rapids/delta/DeltaIOProvider.scala
+++ b/delta-lake/common/src/main/delta-io/scala/com/nvidia/spark/rapids/delta/DeltaIOProvider.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2022-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2022-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -106,10 +106,10 @@ abstract class DeltaIOProvider extends DeltaProviderImplBase {
       writeOptionsFromExec(cpuExec.writeOptions), cpuExec.session)
   }
 
-  private case class DeltaWriteV1Config(
-      deltaLog: DeltaLog,
-      forceOverwrite: Boolean,
-      options: mutable.HashMap[String, String])
+  private class DeltaWriteV1Config(
+      val deltaLog: DeltaLog,
+      val forceOverwrite: Boolean,
+      val options: mutable.HashMap[String, String])
 
   private def extractWriteV1Config(
       meta: RapidsMeta[_, _, _],
@@ -142,7 +142,7 @@ abstract class DeltaIOProvider extends DeltaProviderImplBase {
           f.get(outerObj).asInstanceOf[mutable.HashMap[String, String]]
         }
         if (forceOverwrite.isDefined && options.isDefined) {
-          Some(DeltaWriteV1Config(deltaLog, forceOverwrite.get, options.get))
+          Some(new DeltaWriteV1Config(deltaLog, forceOverwrite.get, options.get))
         } else {
           meta.willNotWorkOnGpu(s"write class has unsupported outer class $outerClass")
           None
diff --git a/delta-lake/common/src/main/delta-io/scala/org/apache/spark/sql/delta/rapids/DeltaRuntimeShim.scala b/delta-lake/common/src/main/delta-io/scala/org/apache/spark/sql/delta/rapids/DeltaRuntimeShim.scala
index 039368e7356..e6d02552d3b 100644
--- a/delta-lake/common/src/main/delta-io/scala/org/apache/spark/sql/delta/rapids/DeltaRuntimeShim.scala
+++ b/delta-lake/common/src/main/delta-io/scala/org/apache/spark/sql/delta/rapids/DeltaRuntimeShim.scala
@@ -30,15 +30,15 @@ import org.apache.spark.sql.execution.datasources.FileFormat
 import org.apache.spark.sql.expressions.UserDefinedFunction
 import org.apache.spark.util.Clock
 
-case class StartTransactionArg(log: DeltaLog, conf: RapidsConf, clock: Clock,
-    catalogTable: Option[CatalogTable] = None, snapshot: Option[Snapshot] = None)
+class StartTransactionArg(val log: DeltaLog, val conf: RapidsConf, val clock: Clock,
+    val catalogTable: Option[CatalogTable] = None, val snapshot: Option[Snapshot] = None)
 
 trait DeltaRuntimeShim {
   def getDeltaConfigChecker: DeltaConfigChecker
   def getDeltaProvider: DeltaProvider
   def startTransaction(log: DeltaLog, conf: RapidsConf, clock: Clock)
   : GpuOptimisticTransactionBase = {
-    startTransaction(StartTransactionArg(log, conf, clock))
+    startTransaction(new StartTransactionArg(log, conf, clock))
   }
   def startTransaction(arg: StartTransactionArg): GpuOptimisticTransactionBase
   def stringFromStringUdf(f: String => String): UserDefinedFunction
diff --git a/delta-lake/common/src/main/delta-io/scala/org/apache/spark/sql/delta/rapids/GpuCheckDeltaInvariant.scala b/delta-lake/common/src/main/delta-io/scala/org/apache/spark/sql/delta/rapids/GpuCheckDeltaInvariant.scala
index 67164017bbe..bcbbef9b9a4 100644
--- a/delta-lake/common/src/main/delta-io/scala/org/apache/spark/sql/delta/rapids/GpuCheckDeltaInvariant.scala
+++ b/delta-lake/common/src/main/delta-io/scala/org/apache/spark/sql/delta/rapids/GpuCheckDeltaInvariant.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2022-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2022-2026, NVIDIA CORPORATION.
  *
  * This file was derived from CheckDeltaInvariant.scala in the
  * Delta Lake project at https://github.com/delta-io/delta.
@@ -132,8 +132,8 @@ object GpuCheckDeltaInvariant extends Logging {
     ExprChecks.projectOnly(
       TypeSig.all,
       TypeSig.all,
-      paramCheck = Seq(ParamCheck("input", TypeSig.all, TypeSig.all)),
-      repeatingParamCheck = Some(RepeatingParamCheck("extra", TypeSig.all, TypeSig.all))
+      paramCheck = Seq(new ParamCheck("input", TypeSig.all, TypeSig.all)),
+      repeatingParamCheck = Some(new RepeatingParamCheck("extra", TypeSig.all, TypeSig.all))
     ),
     (c, conf, p, r) => new GpuCheckDeltaInvariantMeta(c, conf, p, r))
 
diff --git a/delta-lake/common/src/main/delta-io/scala/org/apache/spark/sql/delta/rapids/GpuDeltaLog.scala b/delta-lake/common/src/main/delta-io/scala/org/apache/spark/sql/delta/rapids/GpuDeltaLog.scala
index cdc0b7582e6..8fb66bfb4f2 100644
--- a/delta-lake/common/src/main/delta-io/scala/org/apache/spark/sql/delta/rapids/GpuDeltaLog.scala
+++ b/delta-lake/common/src/main/delta-io/scala/org/apache/spark/sql/delta/rapids/GpuDeltaLog.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2022-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2022-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -40,7 +40,7 @@ class GpuDeltaLog(val deltaLog: DeltaLog, val rapidsConf: RapidsConf) {
    * directly to the DeltaLog otherwise they will not be checked for conflicts.
    */
   def startTransaction(): GpuOptimisticTransactionBase = {
-    DeltaRuntimeShim.startTransaction(StartTransactionArg(deltaLog, rapidsConf, _clock, None,
+    DeltaRuntimeShim.startTransaction(new StartTransactionArg(deltaLog, rapidsConf, _clock, None,
       None))
   }
 
@@ -62,7 +62,7 @@ class GpuDeltaLog(val deltaLog: DeltaLog, val rapidsConf: RapidsConf) {
   def startTransaction(
       catalogTableOpt: Option[CatalogTable],
       snapshotOpt: Option[Snapshot] = None): GpuOptimisticTransactionBase = {
-    DeltaRuntimeShim.startTransaction(StartTransactionArg(deltaLog, rapidsConf, _clock,
+    DeltaRuntimeShim.startTransaction(new StartTransactionArg(deltaLog, rapidsConf, _clock,
       catalogTableOpt, snapshotOpt))
   }
 
diff --git a/delta-lake/common/src/main/scala/com/nvidia/spark/rapids/delta/GpuDeltaTaskStatisticsTracker.scala b/delta-lake/common/src/main/scala/com/nvidia/spark/rapids/delta/GpuDeltaTaskStatisticsTracker.scala
index 4cbd693b01f..464368a326c 100644
--- a/delta-lake/common/src/main/scala/com/nvidia/spark/rapids/delta/GpuDeltaTaskStatisticsTracker.scala
+++ b/delta-lake/common/src/main/scala/com/nvidia/spark/rapids/delta/GpuDeltaTaskStatisticsTracker.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2022-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2022-2026, NVIDIA CORPORATION.
  *
  * This file was derived from DataSkippingStatsTracker.scala
  * in the Delta Lake project at https://github.com/delta-io/delta.
@@ -38,7 +38,7 @@ import org.apache.spark.sql.vectorized.ColumnarBatch
  * A [[WriteTaskStats]] that contains a map from file name to the json representation
  * of the collected statistics.
  */
-case class GpuDeltaFileStatistics(stats: Map[String, String]) extends WriteTaskStats
+class GpuDeltaFileStatistics(val stats: Map[String, String]) extends WriteTaskStats
 
 /**
  * GPU version of DeltaTaskStatisticsTracker.
@@ -168,7 +168,7 @@ class GpuDeltaTaskStatisticsTracker(
   }
 
   override def getFinalStats(taskCommitTime: Long): GpuDeltaFileStatistics = {
-    GpuDeltaFileStatistics(results.toMap)
+    new GpuDeltaFileStatistics(results.toMap)
   }
 }
 
diff --git a/delta-lake/delta-spark400db173/src/main/scala/com/nvidia/spark/rapids/delta/GpuDeltaParquetFileFormatNativeDV.scala b/delta-lake/delta-spark400db173/src/main/scala/com/nvidia/spark/rapids/delta/GpuDeltaParquetFileFormatNativeDV.scala
index 1e39cbc79ef..141b20bd339 100644
--- a/delta-lake/delta-spark400db173/src/main/scala/com/nvidia/spark/rapids/delta/GpuDeltaParquetFileFormatNativeDV.scala
+++ b/delta-lake/delta-spark400db173/src/main/scala/com/nvidia/spark/rapids/delta/GpuDeltaParquetFileFormatNativeDV.scala
@@ -636,11 +636,11 @@ case class GpuDeltaParquetFileFormatNativeDV(
             val (rowGroupOffsets, rowGroupNumRows) =
               RapidsDeletionVectors.getRowGroupMetadata(singleFileInfo.blocks)
             clippedBlocks ++= singleFileInfo.blocks.zipWithIndex.map { case (block, i) =>
-              ParquetSingleDataBlockMeta(
+              new ParquetSingleDataBlockMeta(
                 singleFileInfo.filePath,
-                ParquetDataBlock(block, compressCfg),
+                new ParquetDataBlock(block, compressCfg),
                 metaAndFile.file.partitionValues,
-                ParquetSchemaWrapper(singleFileInfo.schema),
+                new ParquetSchemaWrapper(singleFileInfo.schema),
                 singleFileInfo.readSchema,
                 new DeltaParquetExtraInfo(
                   singleFileInfo.dateRebaseMode,
diff --git a/dist/README.md b/dist/README.md
index aa23b6a6332..840f9a52ee6 100644
--- a/dist/README.md
+++ b/dist/README.md
@@ -28,10 +28,8 @@ provider discovery mechanism
 [ParallelWorldClassloader](https://github.com/openjdk/jdk/blob/jdk8-b120/jaxws/src/share/jaxws_classes/com/sun/istack/internal/tools/ParallelWorldClassLoader.java)) 
 for each version of Spark supported in the jar, i.e., spark330/, spark341/, etc.
 
-If you have to change the contents of the uber jar the following files control what goes into the base jar as classes that are not shaded.
+If you have to change the contents of the uber jar, note that packaging places common classes in the base jar by default whenever binary dedupe proves they are bitwise-identical across shims, so new common classes should normally remain unshimmed. The following files control explicit exceptions and non-class resources.
 
-1. `unshimmed-common-from-single-shim.txt` - This has classes and files that should go into the base jar with their normal
-package name (not shaded). This includes user visible classes (i.e., com/nvidia/spark/SQLPlugin), python files,
-and other files that aren't version specific. Uses Spark 3.2.0 built jar for these base classes as explained above.
-2. `unshimmed-from-each-spark3xx.txt` - This is applied to all the individual Spark specific version jars to pull
-any files that need to go into the base of the jar and not into the Spark specific directory.
+1. `keep-in-spark-shared.txt` - Patterns for bitwise-identical common `spark-shared` class files that must stay in `spark-shared` instead of being promoted to the base jar. This should stay small; add entries only for compatibility or packaging exceptions.
+2. `unshimmed-common-from-single-shim.txt` - Files that must go into the base jar from one representative shim but are not selected by default class promotion, such as root `META-INF` resources and Python worker files. Avoid adding class files here unless they need special root-layout treatment outside bitwise-identical default promotion.
+3. `unshimmed-from-each-spark3xx.txt` - This is applied to each individual Spark-version-specific jar to pull any files that need to go into the base of the jar rather than into the Spark-specific directory. These are per-shim root artifacts rather than common `spark-shared` classes.
diff --git a/dist/build/package-parallel-worlds.py b/dist/build/package-parallel-worlds.py
index 4698c4a8ca0..e612b05b490 100644
--- a/dist/build/package-parallel-worlds.py
+++ b/dist/build/package-parallel-worlds.py
@@ -26,6 +26,30 @@ def shell_exec(shell_cmd):
         self.fail("failed to execute %s" % shell_cmd)
 
 
+def has_fnmatch_magic(pattern):  # True when pattern contains "*", "?" or "["
+    return any(marker in pattern for marker in ("*", "?", "["))
+
+
+def select_matching_members(namelist, patterns):
+    # Returns the members matching any pattern, in pattern order (repeats are kept).
+    fast_mode = os.environ.get("UNSHIM_FAST") == "1"
+    if not fast_mode:
+        return [hit for pat in patterns for hit in fnmatch.filter(namelist, pat)]
+
+    # Fast mode: index members by exact name so literal patterns skip the fnmatch scan.
+    exact_index = {}
+    for member in namelist:
+        exact_index.setdefault(member, []).append(member)
+
+    selected = []
+    for pat in patterns:
+        if has_fnmatch_magic(pat):
+            selected.extend(fnmatch.filter(namelist, pat))
+        else:
+            selected.extend(exact_index.get(pat, []))
+    return selected
+
+
 artifacts = attributes.get('artifact_csv').split(',')
 buildver_list = re.sub(r'\s+', '', project.getProperty('included_buildvers'),
                        flags=re.UNICODE).split(',')
@@ -40,6 +64,12 @@ def shell_exec(shell_cmd):
 art_url = project.getProperty('env.ART_URL')
 jenkins_settings = os.sep.join([source_basedir, 'jenkins', 'settings.xml'])
 repo_local = project.getProperty('maven.repo.local')
+dist_dir = os.sep.join([source_basedir, 'dist'])
+with open(os.sep.join([dist_dir, 'unshimmed-common-from-single-shim.txt']), 'r') as f:
+    from_single_shim = f.read().splitlines()
+with open(os.sep.join([dist_dir, 'unshimmed-from-each-spark3xx.txt']), 'r') as f:
+    from_each = f.read().splitlines()
+from_single_shim_or_each = from_single_shim + from_each
 
 for bv in buildver_list:
     classifier = 'spark' + bv
@@ -73,11 +103,6 @@ def shell_exec(shell_cmd):
                 mvn_cmd.append('='.join(['-Dmaven.repo.local', repo_local]))
             shell_exec(mvn_cmd)
 
-        dist_dir = os.sep.join([source_basedir, 'dist'])
-        with open(os.sep.join([dist_dir, 'unshimmed-common-from-single-shim.txt']), 'r') as f:
-            from_single_shim = f.read().splitlines()
-        with open(os.sep.join([dist_dir, 'unshimmed-from-each-spark3xx.txt']), 'r') as f:
-            from_each = f.read().splitlines()
         with zipfile.ZipFile(os.sep.join([deps_dir, art_jar]), 'r') as zip_handle:
             if project.getProperty('should.build.conventional.jar'):
                 zip_handle.extractall(path=top_dist_jar_dir)
@@ -88,9 +113,6 @@ def shell_exec(shell_cmd):
                     zip_handle.extractall(path=top_dist_jar_dir)
                 # TODO deprecate
                 namelist = zip_handle.namelist()
-                matching_members = []
-                glob_list = from_single_shim + from_each if bv == buildver_list[0] else from_each
-                for pat in glob_list:
-                    new_matches = fnmatch.filter(namelist, pat)
-                    matching_members += new_matches
+                glob_list = from_single_shim_or_each if bv == buildver_list[0] else from_each
+                matching_members = select_matching_members(namelist, glob_list)
                 zip_handle.extractall(path=top_dist_jar_dir, members=matching_members)
diff --git a/dist/keep-in-spark-shared.txt b/dist/keep-in-spark-shared.txt
new file mode 100644
index 00000000000..5fc420febc9
--- /dev/null
+++ b/dist/keep-in-spark-shared.txt
@@ -0,0 +1,6 @@
+# Patterns for common spark-shared class files that must not be promoted to
+# the root layout even when binary dedupe marks them bitwise-identical.
+#
+# Add entries only when a class is bitwise-identical but must remain loaded
+# from spark-shared for compatibility or packaging reasons. New common classes
+# should normally stay unshimmed by default.
diff --git a/dist/maven-antrun/build-parallel-worlds.xml b/dist/maven-antrun/build-parallel-worlds.xml
index afde7c2d755..f6ccf8cb0b9 100644
--- a/dist/maven-antrun/build-parallel-worlds.xml
+++ b/dist/maven-antrun/build-parallel-worlds.xml
@@ -123,6 +123,10 @@
               failonerror="false">
             <env key="UNSHIMMED_COMMON_FROM_SINGLE_SHIM_TXT"
                  value="${spark.rapids.source.basedir}/${rapids.module}/unshimmed-common-from-single-shim.txt"/>
+            <env key="KEEP_IN_SPARK_SHARED_TXT"
+                 value="${spark.rapids.source.basedir}/${rapids.module}/keep-in-spark-shared.txt"/>
+            <env key="UNSHIM_ANALYZER_SCRIPT"
+                 value="${spark.rapids.source.basedir}/${rapids.module}/scripts/analyze-parallel-world-deps.py"/>
         </exec>
         <fail message="exec binary-dedupe.sh failed, exit code is ${build-parallel-worlds.dedupeExitCode}, error msg is ${build-parallel-worlds.dedupeErrorMsg}">
             <condition>
@@ -132,13 +136,14 @@
             </condition>
         </fail>
 
-        <!-- Remove the explicily unshimmed files from the common directory -->
+        <!-- Remove explicitly promoted non-class files from the common directory -->
         <delete>
             <fileset dir="${project.build.directory}/parallel-world/spark-shared"
                      includesfile="${spark.rapids.source.basedir}/${rapids.module}/unshimmed-common-from-single-shim.txt"/>
         </delete>
     </target>
-    <target name="remove-dependencies-from-pom" depends="build-parallel-worlds">
+    <target name="remove-dependencies-from-pom" depends="build-parallel-worlds"
+            unless="rapids.parallel.world.skip.reduced.pom">
         <echo level="info">Generating dependency-reduced-pom.xml</echo>
         <resources id="aggregatorDependencyRegexWithoutWhitespace">
             <string>&lt;dependency&gt;</string>
diff --git a/dist/scripts/analyze-parallel-world-deps.py b/dist/scripts/analyze-parallel-world-deps.py
new file mode 100644
index 00000000000..ab2867db7c4
--- /dev/null
+++ b/dist/scripts/analyze-parallel-world-deps.py
@@ -0,0 +1,617 @@
+#!/usr/bin/env python3
+
+# Copyright (c) 2026, NVIDIA CORPORATION.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+"""Analyze dependencies between conventional, spark-shared, and shim classes.
+
+The dist jar contains classes in the conventional root layout, in spark-shared,
+and in one or more Spark-version-specific directories. This script inspects the
+class files and reports which root or spark-shared classes still have a static
+dependency path to version-specific bytecode.
+"""
+
+import argparse
+import collections
+import json
+import os
+import re
+import struct
+import sys
+import zipfile
+
+
+SHIM_DIR_RE = re.compile(r"^spark[0-9][0-9a-z]*$")  # whole token such as "spark330"
+CLASSIFIER_PACKAGE_RE = re.compile(r"(^|\.)spark[0-9][0-9a-z]*($|\.)")  # same token as a dotted segment
+DESCRIPTOR_CLASS_RE = re.compile(r"L([^;<>\[\]\(\)]+);")  # captures <name> from "L<name>;"
+
+DEFAULT_EXCLUDES = (  # class-name prefixes; presumably the default exclude list - confirm at the CLI
+    "ai.rapids.cudf.",
+    "com.nvidia.shaded.",
+    "org.openucx.",
+)
+
+
+ClassInfo = collections.namedtuple("ClassInfo", ("name", "location", "entry", "deps"))
+
+
+def _read_u1(data, offset):  # -> (data[offset], offset advanced by 1)
+    return data[offset], offset + 1
+
+
+def _read_u2(data, offset):  # -> (big-endian unsigned 16-bit value, offset advanced by 2)
+    return struct.unpack_from(">H", data, offset)[0], offset + 2
+
+
+def _read_u4(data, offset):  # -> (big-endian unsigned 32-bit value, offset advanced by 4)
+    return struct.unpack_from(">I", data, offset)[0], offset + 4
+
+
+def _class_names_from_descriptor(value):
+    # Lazily yields the captured name of every "L<name>;" token found in value.
+    yield from (token.group(1) for token in DESCRIPTOR_CLASS_RE.finditer(value))
+
+
+def _normalize_internal_name(value):
+    # Maps a CONSTANT_Class name string to the list of class names it refers to.
+    if not value:
+        return []
+    # A slash-separated name that is neither an array ("[") nor a "(" descriptor is
+    # already a class name; everything else is scanned for "L<name>;" tokens.
+    is_plain_name = "/" in value and not value.startswith(("[", "("))
+    return [value] if is_plain_name else list(_class_names_from_descriptor(value))
+
+
+def parse_class_file(data):  # -> (dotted class name, set of dotted dependency names)
+    magic, offset = _read_u4(data, 0)
+    if magic != 0xCAFEBABE:
+        raise ValueError("not a class file")
+
+    # minor_version, major_version (read only to advance the offset)
+    _, offset = _read_u2(data, offset)
+    _, offset = _read_u2(data, offset)
+
+    cp_count, offset = _read_u2(data, offset)
+    constant_pool = [None] * cp_count  # only Utf8 and Class slots are filled in below
+    class_name_indexes = []
+    utf8_values = []
+
+    index = 1  # the walk starts at slot 1; slot 0 is never populated
+    while index < cp_count:
+        tag, offset = _read_u1(data, offset)
+        if tag == 1:  # CONSTANT_Utf8
+            length, offset = _read_u2(data, offset)
+            raw = data[offset:offset + length]
+            offset += length
+            value = raw.decode("utf-8", errors="replace")
+            constant_pool[index] = value
+            utf8_values.append(value)
+        elif tag in (3, 4):  # Integer, Float
+            offset += 4
+        elif tag in (5, 6):  # Long, Double
+            offset += 8
+            index += 1  # extra bump on top of the shared one below: two slots consumed
+        elif tag == 7:  # Class
+            name_index, offset = _read_u2(data, offset)
+            constant_pool[index] = name_index  # stores the index of the name, not the name
+            class_name_indexes.append(name_index)
+        elif tag == 8:  # String
+            offset += 2
+        elif tag in (9, 10, 11, 12, 17, 18):  # refs, NameAndType, Dynamic, InvokeDynamic
+            offset += 4
+        elif tag == 15:  # MethodHandle
+            offset += 3
+        elif tag in (16, 19, 20):  # MethodType, Module, Package
+            offset += 2
+        else:
+            raise ValueError("unknown constant pool tag %s" % tag)
+        index += 1
+
+    # access_flags (skipped), then this_class -> Class slot -> Utf8 name
+    _, offset = _read_u2(data, offset)
+    this_class_index, offset = _read_u2(data, offset)
+    this_name_index = constant_pool[this_class_index]
+    this_name = constant_pool[this_name_index]
+
+    deps = set()
+    for name_index in class_name_indexes:  # names referenced through Class entries
+        for dep in _normalize_internal_name(constant_pool[name_index]):
+            deps.add(dep.replace("/", "."))
+    for value in utf8_values:  # plus every "L<name>;" token found in any Utf8 constant
+        for dep in _class_names_from_descriptor(value):
+            deps.add(dep.replace("/", "."))
+
+    class_name = this_name.replace("/", ".")
+    deps.discard(class_name)  # a class is not reported as its own dependency
+    return class_name, deps
+
+
+def location_from_entry(entry):
+    # Classifies an entry by its first path component.
+    top_dir = entry.partition("/")[0]
+    if top_dir == "spark-shared" or SHIM_DIR_RE.match(top_dir):
+        # spark-shared and shim directories are identified by the directory name itself.
+        return top_dir
+    return "root"
+
+
+def is_classifier_class(class_name):  # True when CLASSIFIER_PACKAGE_RE finds a segment
+    return CLASSIFIER_PACKAGE_RE.search(class_name) is not None
+
+
+def is_version_location(location):  # True when location matches SHIM_DIR_RE
+    return SHIM_DIR_RE.match(location) is not None
+
+
+def is_version_node(node):
+    # node is a (class_name, location) pair; either part can mark it version-specific.
+    return is_version_location(node[1]) or is_classifier_class(node[0])
+
+
+def iter_class_entries(path):  # yields (entry name using "/" separators, class file bytes)
+    if zipfile.is_zipfile(path):
+        with zipfile.ZipFile(path) as zf:
+            for name in zf.namelist():
+                # Test the base name so a root-level module-info.class is skipped as well.
+                if name.endswith(".class") and name.rsplit("/", 1)[-1] != "module-info.class":
+                    yield name, zf.read(name)
+        return
+    for root, _, files in os.walk(path):
+        for file_name in files:
+            if not file_name.endswith(".class") or file_name == "module-info.class":
+                continue
+            full_path = os.path.join(root, file_name)
+            rel_path = os.path.relpath(full_path, path).replace(os.sep, "/")
+            with open(full_path, "rb") as fh:
+                yield rel_path, fh.read()
+
+
+def should_exclude(class_name, prefixes):  # True when class_name starts with any prefix
+    return class_name.startswith(tuple(prefixes))
+
+
+def load_classes(path, exclude_prefixes):  # -> (classes by node, locations by name, errors)
+    classes = {}
+    name_locations = collections.defaultdict(set)
+    errors = []
+    for entry, data in iter_class_entries(path):
+        try:
+            class_name, deps = parse_class_file(data)
+        except (ValueError, struct.error, IndexError, TypeError) as exc:  # incl. truncated data
+            errors.append("%s: %s" % (entry, exc))  # record and keep scanning the archive
+            continue
+        if should_exclude(class_name, exclude_prefixes):
+            continue
+        location = location_from_entry(entry)
+        info = ClassInfo(class_name, location, entry, deps)
+        node = (class_name, location)  # the same class name may exist in several locations
+        classes[node] = info
+        name_locations[class_name].add(location)
+    return classes, name_locations, errors
+
+
+def resolve_dependency_targets(source_location, dep_name, name_locations):
+    candidates = name_locations.get(dep_name)
+    if not candidates:
+        return []
+
+    # Resolution order mirrors class loading in the current layout: the
+    # conventional root copy first, then the referencing class's own location,
+    # then spark-shared, then every remaining location in sorted order.
+    priority = []
+    for slot in ("root", source_location, "spark-shared"):
+        if slot in candidates and slot not in priority:
+            priority.append(slot)
+    rest = sorted(where for where in candidates if where not in priority)
+    return [(dep_name, where) for where in priority + rest]
+
+
+def build_graph(classes, name_locations):  # -> {node: set of nodes it depends on}
+    edges = {node: set() for node in classes}
+    for node, info in classes.items():
+        # Keep only resolved targets that were actually loaded as classes.
+        for dep_name in info.deps:
+            resolved = resolve_dependency_targets(info.location, dep_name, name_locations)
+            edges[node].update(target for target in resolved if target in classes)
+    return edges
+
+
+def reverse_graph(graph):  # -> {node: set of nodes with an edge pointing at it}
+    predecessors = {node: set() for node in graph}
+    for origin in graph:
+        for successor in graph[origin]:
+            predecessors[successor].add(origin)
+    return predecessors
+
+
+def reachable_to_version_specific(graph):
+    users_of = reverse_graph(graph)
+    version_nodes = {node for node in graph if is_version_node(node)}
+    marked = set(version_nodes)
+    frontier = collections.deque(version_nodes)
+    while frontier:
+        # Follow reversed edges so that every node which transitively depends
+        # on a version node ends up in the marked set.
+        for user in users_of[frontier.popleft()] - marked:
+            marked.add(user)
+            frontier.append(user)
+    return marked, version_nodes
+
+
+def shortest_path_to_version(graph, start):
+    pending = collections.deque([[start]])  # breadth-first queue of whole paths
+    visited = {start}
+    while pending:
+        trail = pending.popleft()
+        if trail[-1] != start and is_version_node(trail[-1]):
+            return trail
+        for neighbour in sorted(graph[trail[-1]]):
+            if neighbour not in visited:
+                visited.add(neighbour)
+                pending.append(trail + [neighbour])
+    return None
+
+
+def tarjan_scc(graph):
+    """Return graph's strongly connected components (Tarjan's algorithm), using an
+    explicit work stack instead of recursion so deep dependency chains cannot
+    overflow the interpreter stack; the global recursion limit stays untouched."""
+    index = 0
+    stack, on_stack = [], set()
+    indexes, lowlinks = {}, {}
+    components, work = [], []  # work holds (node, iterator over remaining successors)
+
+    def enter(node):
+        nonlocal index
+        indexes[node] = lowlinks[node] = index
+        index += 1
+        stack.append(node)
+        on_stack.add(node)
+        work.append((node, iter(graph[node])))
+
+    for root in graph:
+        if root not in indexes:
+            enter(root)
+        while work:
+            node, successors = work[-1]
+            for next_node in successors:
+                if next_node not in indexes:
+                    enter(next_node)  # descend; this frame resumes once the child is done
+                    break
+                if next_node in on_stack:
+                    lowlinks[node] = min(lowlinks[node], indexes[next_node])
+            else:
+                work.pop()
+                if work:  # hand the finished child's lowlink to its parent frame
+                    lowlinks[work[-1][0]] = min(lowlinks[work[-1][0]], lowlinks[node])
+                if lowlinks[node] == indexes[node]:
+                    component = []
+                    while not component or component[-1] != node:
+                        component.append(stack.pop())
+                        on_stack.remove(component[-1])
+                    components.append(component)
+    return components
+
+
+def dependency_first_component_order(graph, components):
+    """Return component ids ordered so prerequisites come before their users."""
+    comp_by_node = {
+        node: comp_id
+        for comp_id, component in enumerate(components)
+        for node in component
+    }
+
+    # An edge source -> target means "source depends on target", so each
+    # component records the components that use it and Kahn's algorithm
+    # releases a user only once all of its prerequisites have been emitted.
+    # pending[c] is the number of distinct components that c still waits for.
+    users = collections.defaultdict(set)
+    pending = [0] * len(components)
+    for source, targets in graph.items():
+        source_comp = comp_by_node[source]
+        for target in targets:
+            target_comp = comp_by_node[target]
+            if target_comp != source_comp and source_comp not in users[target_comp]:
+                users[target_comp].add(source_comp)
+                pending[source_comp] += 1
+
+    ready = collections.deque(
+        comp_id for comp_id, count in enumerate(pending) if count == 0)
+    ordered = []
+    while ready:
+        comp_id = ready.popleft()
+        ordered.append(comp_id)
+        for dependent in sorted(users[comp_id]):
+            pending[dependent] -= 1
+            if pending[dependent] == 0:
+                ready.append(dependent)
+    return ordered
+
+
+def format_node(node):
+    class_name, location = node  # a graph node is a (class name, location) pair
+    return "%s (%s)" % (class_name, location)
+
+
+def print_path(path):
+    return " -> ".join(format_node(node) for node in path)  # builds the string; does not print
+
+
+def json_node(node):
+    class_name, location = node  # a graph node is a (class name, location) pair
+    return {
+        "className": class_name,
+        "location": location,
+    }
+
+
+def location_relative_entry(info):
+    # Root entries are returned unchanged; for any other location the first
+    # path segment of the entry is dropped when the entry contains a "/".
+    if info.location == "root":
+        return info.entry
+    _, separator, remainder = info.entry.partition("/")
+    return remainder if separator else info.entry
+
+
+def direct_classifier_edges(graph):
+    # Sorted (source, target) edges that lead from a non-classifier class
+    # directly to a classifier class.
+    return sorted(
+        (source, target)
+        for source, targets in graph.items()
+        if not is_classifier_class(source[0])
+        for target in targets
+        if is_classifier_class(target[0]))
+
+
+def version_blocker_counts(graph, version_nodes, root_or_shared):
+    """Count root/shared classes that can reach each version-specific node."""
+    rev = reverse_graph(graph)
+    counts = []
+    for version_node in sorted(version_nodes):  # one independent reverse BFS per version node
+        seen = {version_node}
+        queue = collections.deque([version_node])
+        impacted = set()  # root/shared ancestors of this version node
+        while queue:
+            node = queue.popleft()
+            for parent in rev[node]:
+                if parent in seen:
+                    continue
+                seen.add(parent)
+                queue.append(parent)
+                if parent in root_or_shared:
+                    impacted.add(parent)
+        if impacted:  # version nodes with no root/shared ancestor are omitted
+            counts.append((len(impacted), version_node))
+    return sorted(counts, key=lambda item: (-item[0], item[1]))  # largest count first, ties by node
+
+
+def nearest_version_target_counts(graph, blocked):
+    """Count terminal version nodes from each blocked node's shortest path."""
+    rev = reverse_graph(graph)
+    distance = {}  # node -> edge count to the nearest version node
+    queue = collections.deque()
+    for node in sorted(node for node in graph if is_version_node(node)):
+        distance[node] = 0  # every version node is a BFS source
+        queue.append(node)
+
+    while queue:  # multi-source BFS over reversed edges
+        node = queue.popleft()
+        for parent in sorted(rev[node]):
+            if parent in distance:
+                continue
+            distance[parent] = distance[node] + 1
+            queue.append(parent)
+
+    def rebuild_path(start):
+        path = [start]
+        node = start
+        while not is_version_node(node):
+            next_node = None
+            for candidate in sorted(graph[node]):  # first sorted successor that is one step closer
+                if distance.get(candidate) == distance[node] - 1:
+                    next_node = candidate
+                    break
+            if next_node is None:
+                return None
+            path.append(next_node)
+            node = next_node
+        return path
+
+    counts = collections.Counter()  # terminal version node -> number of blocked nodes ending there
+    examples = {}  # terminal version node -> first path found that ends there
+    paths = []
+    for node in blocked:
+        if node not in distance:
+            continue  # no route to any version node
+        path = rebuild_path(node)
+        if not path:
+            continue
+        paths.append((node, path))
+        target = path[-1]
+        counts[target] += 1
+        examples.setdefault(target, path)
+    ranked = sorted(
+        ((count, target, examples[target]) for target, count in counts.items()),
+        key=lambda item: (-item[0], item[1]))  # largest count first, ties by node
+    return ranked, paths
+
+
+def main():
+    """Parse CLI options, analyze the class graph, and emit a text or JSON report."""
+    parser = argparse.ArgumentParser(description=__doc__)
+    parser.add_argument("path", help="dist/target/parallel-world directory or a dist jar")
+    parser.add_argument("--limit", type=int, default=20,
+        help="maximum number of examples to print per section")
+    parser.add_argument("--exclude-prefix", action="append", default=[],
+        help="class name prefix to exclude; may be passed more than once")
+    parser.add_argument("--show-safe", action="store_true",
+        help="print examples of spark-shared classes with no path to version-specific code")
+    parser.add_argument("--show-topo", action="store_true",
+        help="print root-safe spark-shared SCCs in dependency-first order")
+    parser.add_argument("--show-reachability", action="store_true",
+        help="print overlapping reachability counts for version-specific nodes")
+    parser.add_argument("--format", choices=("text", "json"), default="text",
+        help="output format")
+    parser.add_argument("--write-safe-paths",
+        help="write root-safe spark-shared class paths, one per line")
+    args = parser.parse_args()
+
+    exclude_prefixes = tuple(DEFAULT_EXCLUDES) + tuple(args.exclude_prefix)
+    classes, name_locations, errors = load_classes(args.path, exclude_prefixes)
+    graph = build_graph(classes, name_locations)
+    contaminated, version_nodes = reachable_to_version_specific(graph)
+    components = tarjan_scc(graph)
+    component_order = dependency_first_component_order(graph, components)
+
+    by_location = collections.Counter(info.location for info in classes.values())
+    root_or_shared = {
+        node for node, info in classes.items()
+        if info.location in ("root", "spark-shared") and not is_classifier_class(info.name)
+    }
+    blocked = sorted(root_or_shared & contaminated)
+    safe_shared = sorted(
+        node for node in root_or_shared - contaminated
+        if classes[node].location == "spark-shared")
+    classifier_edges = direct_classifier_edges(graph)
+    version_components = [comp for comp in components if any(is_version_node(node) for node in comp)]
+    safe_shared_set = set(safe_shared)  # O(1) membership; the sorted list made the loop quadratic
+    safe_sccs = []
+    for comp_id in component_order:
+        safe_members = sorted(node for node in components[comp_id] if node in safe_shared_set)
+        if safe_members:
+            safe_sccs.append((comp_id, safe_members))
+    version_blockers = (
+        version_blocker_counts(graph, version_nodes, root_or_shared)
+        if args.show_reachability or args.format == "json" else [])
+    nearest_targets, blocked_paths = nearest_version_target_counts(graph, blocked)
+    safe_shared_paths = sorted(location_relative_entry(classes[node]) for node in safe_shared)
+
+    if args.write_safe_paths:
+        with open(args.write_safe_paths, "w", encoding="utf-8") as out:
+            for path in safe_shared_paths:
+                out.write(path + "\n")
+
+    if args.format == "json":
+        output = {
+            "path": args.path,
+            "classCount": len(classes),
+            "locationCounts": dict(sorted(by_location.items())),
+            "versionSpecificNodeCount": len(version_nodes),
+            "rootOrSharedBlockedCount": len(blocked),
+            "rootSafeSparkSharedCount": len(safe_shared),
+            "sccCount": len(components),
+            "versionSpecificSccCount": len(version_components),
+            "directClassifierDependencyCount": len(classifier_edges),
+            "rootSafeSparkSharedPaths": safe_shared_paths,
+            "directClassifierDependencyExamples": [
+                {
+                    "source": json_node(source),
+                    "target": json_node(target),
+                }
+                for source, target in classifier_edges[:args.limit]
+            ],
+            "topVersionBlockersByReachability": [
+                {
+                    "blockedRootOrSharedCount": count,
+                    "target": json_node(target),
+                }
+                for count, target in version_blockers[:args.limit]
+            ],
+            "nearestVersionTargetCounts": [
+                {
+                    "blockedShortestPathCount": count,
+                    "target": json_node(target),
+                    "examplePath": [json_node(node) for node in path],
+                }
+                for count, target, path in nearest_targets[:args.limit]
+            ],
+            "rootSafeSparkSharedSccCount": len(safe_sccs),
+            "rootSafeSparkSharedSccExamples": [
+                {
+                    "componentId": comp_id,
+                    "classCount": len(members),
+                    "classExamples": [json_node(node) for node in members[:args.limit]],
+                }
+                for comp_id, members in safe_sccs[:args.limit]
+            ],
+            "blockedExamples": [
+                [json_node(node) for node in path]
+                for _, path in blocked_paths[:args.limit]
+            ],
+        }
+        json.dump(output, sys.stdout, indent=2, sort_keys=True)
+        print()
+        return
+
+    print("Loaded %d classes from %s" % (len(classes), args.path))
+    if errors:
+        print("Skipped %d malformed class files" % len(errors))
+    print("Class locations:")
+    for location, count in sorted(by_location.items()):
+        print("  %s: %d" % (location, count))
+    print("Version-specific/classifier nodes: %d" % len(version_nodes))
+    print("Root or spark-shared nodes with a path to version-specific code: %d" % len(blocked))
+    print("Root-safe spark-shared nodes: %d" % len(safe_shared))
+    print("SCCs: %d total, %d containing version-specific code" %
+        (len(components), len(version_components)))
+
+    print("\nDirect classifier-package dependencies: %d" % len(classifier_edges))
+    for source, target in classifier_edges[:args.limit]:
+        print("  %s -> %s" % (format_node(source), format_node(target)))
+    if len(classifier_edges) > args.limit:
+        print("  ... %d more" % (len(classifier_edges) - args.limit))
+
+    if args.show_reachability:
+        print("\nTop version-specific blockers by upstream root/shared reachability:")
+        for count, target in version_blockers[:args.limit]:
+            print("  %d <- %s" % (count, format_node(target)))
+        if len(version_blockers) > args.limit:
+            print("  ... %d more" % (len(version_blockers) - args.limit))
+
+    print("\nNearest version targets from shortest blocked paths:")
+    for count, target, path in nearest_targets[:args.limit]:
+        print("  %d -> %s" % (count, format_node(target)))
+        print("    e.g. %s" % print_path(path))
+    if len(nearest_targets) > args.limit:
+        print("  ... %d more" % (len(nearest_targets) - args.limit))
+
+    print("\nNearest paths from root/spark-shared code to version-specific code:")
+    for _, path in blocked_paths[:args.limit]:
+        print("  %s" % print_path(path))
+    if len(blocked) > args.limit:
+        print("  ... %d more blocked classes" % (len(blocked) - args.limit))
+
+    if args.show_safe:
+        print("\nSpark-shared classes with no path to version-specific code:")
+        for node in safe_shared[:args.limit]:
+            print("  %s" % format_node(node))
+        if len(safe_shared) > args.limit:
+            print("  ... %d more" % (len(safe_shared) - args.limit))
+
+    if args.show_topo:
+        print("\nRoot-safe spark-shared SCCs in dependency-first order:")
+        for printed, (comp_id, safe_members) in enumerate(safe_sccs):
+            print("  component %d, %d class(es)" % (comp_id, len(safe_members)))
+            for node in safe_members[:3]:
+                print("    %s" % format_node(node))
+            if len(safe_members) > 3:
+                print("    ... %d more in component" % (len(safe_members) - 3))
+            if printed + 1 >= args.limit:
+                break
+
+
+if __name__ == "__main__":
+    sys.exit(main())  # main() returns None, so a completed run exits with status 0
diff --git a/dist/scripts/binary-dedupe.sh b/dist/scripts/binary-dedupe.sh
index 2054e18ccf9..ea3ac931413 100755
--- a/dist/scripts/binary-dedupe.sh
+++ b/dist/scripts/binary-dedupe.sh
@@ -35,10 +35,34 @@ esac
 
 STEP=0
 export SPARK_SHARED_TXT="$PWD/spark-shared.txt"
+export SPARK_SHARED_CLASSES_TXT="$PWD/spark-shared-classes.txt"
 export SPARK_SHARED_COPY_LIST="$PWD/spark-shared-copy-list.txt"
 export DELETE_DUPLICATES_TXT="$PWD/delete-duplicates.txt"
 export SPARK_SHARED_DIR="$PWD/spark-shared"
 export UNSHIMMED_FROM_SPARK_SHARED_COPY_LIST="$PWD/unshimmed-from-spark-shared-copy-list.txt"
+export ROOT_SAFE_SPARK_SHARED_TXT="$PWD/root-safe-spark-shared.txt"
+export DEFAULT_UNSHIMMED_SPARK_SHARED_TXT="$PWD/default-unshimmed-spark-shared.txt"
+export UNSHIMMED_NEED_SHARED_TXT="$PWD/unshimmed-need-shared.txt"
+export UNSHIMMED_MISSING_SHARED_TXT="$PWD/unshimmed-missing-shared.txt"
+
+SPARK_SHIM_DIRS=()
+if [[ "${UNSHIM_FAST:-0}" == "1" ]]; then
+  while IFS= read -r shim_dir; do
+    SPARK_SHIM_DIRS+=("$shim_dir")
+  done < <(find ./parallel-world -maxdepth 1 -mindepth 1 -type d -name 'spark[34]*' | sort)
+fi
+
+DEDUPE_CACHE_DIR="${UNSHIM_DEDUPE_CACHE_DIR:-}"
+DEDUPE_CACHE_SPARK_SHARED_TXT=""
+DEDUPE_CACHE_SHA1_FILES_TXT=""
+DEDUPE_CACHE_SHIM_SHA_PACKAGE_FILES_TXT=""
+DEDUPE_CACHE_COUNT_SHIM_SHA_PACKAGE_FILES_TXT=""
+if [[ -n "$DEDUPE_CACHE_DIR" ]]; then
+  DEDUPE_CACHE_SPARK_SHARED_TXT="$DEDUPE_CACHE_DIR/spark-shared.txt"
+  DEDUPE_CACHE_SHA1_FILES_TXT="$DEDUPE_CACHE_DIR/tmp-sha1-files.txt"
+  DEDUPE_CACHE_SHIM_SHA_PACKAGE_FILES_TXT="$DEDUPE_CACHE_DIR/tmp-shim-sha-package-files.txt"
+  DEDUPE_CACHE_COUNT_SHIM_SHA_PACKAGE_FILES_TXT="$DEDUPE_CACHE_DIR/tmp-count-shim-sha-package-files.txt"
+fi
 
 # This script de-duplicates .class files at the binary level.
 # We could also diff classes using scalap / javap outputs.
@@ -55,24 +79,54 @@ export UNSHIMMED_FROM_SPARK_SHARED_COPY_LIST="$PWD/unshimmed-from-spark-shared-c
 # - put the path starting with /sparkxyz back together for the final list
 echo "Retrieving class files hashing to a single value ..."
 
-
-echo "$((++STEP))/ SHA1 of all non-META files > tmp-sha1-files.txt"
-find ./parallel-world/spark[34]* -name META-INF -prune -o -name webapps -prune -o \( -type f -print0 \) | \
-  xargs --null $SHASUM > tmp-sha1-files.txt
-
-echo "$((++STEP))/ make shim column 1 > tmp-shim-sha-package-files.txt"
-< tmp-sha1-files.txt awk -F/ '$1=$1' | \
-  awk '{checksum=$1; shim=$4; $1=shim; $2=$3=""; $4=checksum;  print $0}' | \
-  tr -s  ' ' > tmp-shim-sha-package-files.txt
-
-echo "$((++STEP))/ sort by path, sha1; output first from each group > tmp-count-shim-sha-package-files.txt"
-sort -k3 -k2,2 -u tmp-shim-sha-package-files.txt | \
-  uniq -f 2 -c > tmp-count-shim-sha-package-files.txt
-
-echo "$((++STEP))/ files with unique sha1 > $SPARK_SHARED_TXT"
-grep '^\s\+1 .*' tmp-count-shim-sha-package-files.txt | \
-  awk '{$1=""; $3=""; print $0 }' | \
-  tr -s ' ' | sed 's/\ /\//g' > "$SPARK_SHARED_TXT"
+CACHE_HIT=0
+if [[ -n "$DEDUPE_CACHE_SPARK_SHARED_TXT" && \
+      -f "$DEDUPE_CACHE_SPARK_SHARED_TXT" && \
+      -f "$DEDUPE_CACHE_SHA1_FILES_TXT" && \
+      -f "$DEDUPE_CACHE_SHIM_SHA_PACKAGE_FILES_TXT" && \
+      -f "$DEDUPE_CACHE_COUNT_SHIM_SHA_PACKAGE_FILES_TXT" ]]; then
+  echo "$((++STEP))/ reusing cached files with unique sha1 > $SPARK_SHARED_TXT"
+  cp "$DEDUPE_CACHE_SPARK_SHARED_TXT" "$SPARK_SHARED_TXT"
+  cp "$DEDUPE_CACHE_SHA1_FILES_TXT" tmp-sha1-files.txt
+  cp "$DEDUPE_CACHE_SHIM_SHA_PACKAGE_FILES_TXT" tmp-shim-sha-package-files.txt
+  cp "$DEDUPE_CACHE_COUNT_SHIM_SHA_PACKAGE_FILES_TXT" tmp-count-shim-sha-package-files.txt
+  CACHE_HIT=1
+# With one shim there is no cross-shim identity proof to perform; every
+# non-META file is the sole representative for its path.
+elif [[ "${UNSHIM_FAST:-0}" == "1" && "${#SPARK_SHIM_DIRS[@]}" == "1" ]]; then
+  echo "$((++STEP))/ single shim fast path; listing files > $SPARK_SHARED_TXT"
+  : > tmp-sha1-files.txt
+  : > tmp-shim-sha-package-files.txt
+  : > tmp-count-shim-sha-package-files.txt
+  find "${SPARK_SHIM_DIRS[0]}" -name META-INF -prune -o -name webapps -prune -o \( -type f -print \) | \
+    sort | sed 's|^\./parallel-world||' > "$SPARK_SHARED_TXT"
+else
+  echo "$((++STEP))/ SHA1 of all non-META files > tmp-sha1-files.txt"
+  find ./parallel-world/spark[34]* -name META-INF -prune -o -name webapps -prune -o \( -type f -print0 \) | \
+    xargs --null $SHASUM > tmp-sha1-files.txt
+
+  echo "$((++STEP))/ make shim column 1 > tmp-shim-sha-package-files.txt"
+  < tmp-sha1-files.txt awk -F/ '$1=$1' | \
+    awk '{checksum=$1; shim=$4; $1=shim; $2=$3=""; $4=checksum;  print $0}' | \
+    tr -s  ' ' > tmp-shim-sha-package-files.txt
+
+  echo "$((++STEP))/ sort by path, sha1; output first from each group > tmp-count-shim-sha-package-files.txt"
+  sort -k3 -k2,2 -u tmp-shim-sha-package-files.txt | \
+    uniq -f 2 -c > tmp-count-shim-sha-package-files.txt
+
+  echo "$((++STEP))/ files with unique sha1 > $SPARK_SHARED_TXT"
+  grep '^\s\+1 .*' tmp-count-shim-sha-package-files.txt | \
+    awk '{$1=""; $3=""; print $0 }' | \
+    tr -s ' ' | sed 's/\ /\//g' > "$SPARK_SHARED_TXT"
+fi
+
+if [[ "$CACHE_HIT" == "0" && -n "$DEDUPE_CACHE_SPARK_SHARED_TXT" ]]; then
+  mkdir -p "$DEDUPE_CACHE_DIR"
+  cp "$SPARK_SHARED_TXT" "$DEDUPE_CACHE_SPARK_SHARED_TXT"
+  cp tmp-sha1-files.txt "$DEDUPE_CACHE_SHA1_FILES_TXT"
+  cp tmp-shim-sha-package-files.txt "$DEDUPE_CACHE_SHIM_SHA_PACKAGE_FILES_TXT"
+  cp tmp-count-shim-sha-package-files.txt "$DEDUPE_CACHE_COUNT_SHIM_SHA_PACKAGE_FILES_TXT"
+fi
 
 function retain_single_copy() {
   set -e
@@ -100,9 +154,10 @@ function retain_single_copy() {
   done >> "$DELETE_DUPLICATES_TXT" || exit 255
 }
 
-function copy_unshimmed_from_spark_shared() {
+function append_matching_spark_shared_patterns() {
   set -e
-  local unshimmed_patterns_txt="${UNSHIMMED_COMMON_FROM_SINGLE_SHIM_TXT:-}"
+  local unshimmed_patterns_txt="$1"
+  local output_txt="$2"
 
   [[ -n "$unshimmed_patterns_txt" ]] || return 0
   [[ -f "$unshimmed_patterns_txt" ]] || {
@@ -110,23 +165,102 @@ function copy_unshimmed_from_spark_shared() {
     exit 255
   }
 
-  : > "$UNSHIMMED_FROM_SPARK_SHARED_COPY_LIST"
-  while read -r shared_path; do
-    local rel_path="${shared_path#./parallel-world/spark-shared/}"
-    local pattern
-    while read -r pattern; do
-      [[ -n "$pattern" ]] || continue
-      [[ "$pattern" =~ ^[[:space:]]*# ]] && continue
-      # shellcheck disable=SC2053
-      if [[ "$rel_path" == $pattern ]]; then
-        echo "$rel_path" >> "$UNSHIMMED_FROM_SPARK_SHARED_COPY_LIST"
-        break
-      fi
-    done < "$unshimmed_patterns_txt"
-  done < <(find ./parallel-world/spark-shared -type f)
+  local shared_dir="./parallel-world/spark-shared"
+  local pattern
+  while IFS= read -r pattern; do
+    [[ -n "$pattern" ]] || continue
+    [[ "$pattern" =~ ^[[:space:]]*# ]] && continue
+    case "$pattern" in
+      *[\*\?\[]*)
+        find "$shared_dir" -type f -path "$shared_dir/$pattern" |
+          sed "s|^\./parallel-world/spark-shared/||" >> "$output_txt"
+        ;;
+      *)
+        if [[ -f "$shared_dir/$pattern" ]]; then
+          echo "$pattern" >> "$output_txt"
+        fi
+        ;;
+    esac
+  done < "$unshimmed_patterns_txt"
+}
+
+function write_root_safe_spark_shared_classes() {
+  set -e
+  local analyzer_script="${UNSHIM_ANALYZER_SCRIPT:-}"  # an explicit override wins
+  if [[ -z "$analyzer_script" && -n "${UNSHIMMED_COMMON_FROM_SINGLE_SHIM_TXT:-}" ]]; then
+    analyzer_script="$(dirname "$UNSHIMMED_COMMON_FROM_SINGLE_SHIM_TXT")/scripts/analyze-parallel-world-deps.py"
+  fi  # fallback: scripts/ directory next to the allowlist file
+  [[ -n "$analyzer_script" && -f "$analyzer_script" ]] || {
+    echo >&2 "Cannot locate analyze-parallel-world-deps.py for default unshim analysis"
+    exit 255
+  }
+
+  echo "$((++STEP))/ analyzing spark-shared dependency paths > $ROOT_SAFE_SPARK_SHARED_TXT"
+  python3 "$analyzer_script" ./parallel-world \
+    --write-safe-paths "$ROOT_SAFE_SPARK_SHARED_TXT"
+}  # NOTE(review): no consumer of $ROOT_SAFE_SPARK_SHARED_TXT is visible in this hunk - confirm it is used
 
+function write_default_unshimmed_spark_shared_classes() {
+  set -e  # the pipeline below strips the leading /spark*/ segment, keeps *.class, de-duplicates
+  echo "$((++STEP))/ selecting all bitwise-identical spark-shared classes > $DEFAULT_UNSHIMMED_SPARK_SHARED_TXT"
+  sed -E "s|^/spark[^/]*/||" "$SPARK_SHARED_TXT" | \
+    grep '\.class$' | sort -u > "$DEFAULT_UNSHIMMED_SPARK_SHARED_TXT"
+}
+
+function keep_in_spark_shared() {
+  set -e
+  local class_file="$1"  # path to test against the keep patterns
+  local keep_patterns_txt="${KEEP_IN_SPARK_SHARED_TXT:-}"
+  [[ -n "$keep_patterns_txt" ]] || return 1  # no keep list configured: nothing is kept
+  [[ -f "$keep_patterns_txt" ]] || {
+    echo >&2 "Keep-in-spark-shared list does not exist: $keep_patterns_txt"
+    exit 255
+  }
+
+  local pattern
+  while read -r pattern || [[ -n "$pattern" ]]; do  # default IFS trims; also reads an unterminated last line
+    [[ -n "$pattern" ]] || continue
+    [[ "$pattern" =~ ^[[:space:]]*# ]] && continue
+    # shellcheck disable=SC2053
+    if [[ "$class_file" == $pattern ]]; then
+      return 0  # first matching glob wins
+    fi
+  done < "$keep_patterns_txt"
+  return 1
+}
+
+function filter_keep_in_spark_shared() {
+  set -e
+  local input_txt="$1"  # list of class paths, one per line
+  local output_txt="$2"  # receives the lines of input_txt that are not kept in spark-shared
+  local class_file
+  : > "$output_txt"
+  while IFS= read -r class_file; do
+    [[ -n "$class_file" ]] || continue
+    if keep_in_spark_shared "$class_file"; then
+      continue  # matches a keep pattern: leave it out of the output
+    fi
+    echo "$class_file"
+  done < "$input_txt" > "$output_txt.tmp"
+  mv "$output_txt.tmp" "$output_txt"  # results are staged in .tmp and then renamed over the output
+}
+
+function copy_unshimmed_from_spark_shared() {
+  set -e
+  local raw_copy_list="$UNSHIMMED_FROM_SPARK_SHARED_COPY_LIST.raw"
+  local sorted_copy_list="$UNSHIMMED_FROM_SPARK_SHARED_COPY_LIST.sorted"
+
+  : > "$raw_copy_list"
+  write_root_safe_spark_shared_classes
+  write_default_unshimmed_spark_shared_classes
+  cat "$DEFAULT_UNSHIMMED_SPARK_SHARED_TXT" >> "$raw_copy_list"
+  append_matching_spark_shared_patterns \
+    "${UNSHIMMED_COMMON_FROM_SINGLE_SHIM_TXT:-}" "$raw_copy_list"
+
+  sort -u "$raw_copy_list" > "$sorted_copy_list"
+  filter_keep_in_spark_shared "$sorted_copy_list" "$UNSHIMMED_FROM_SPARK_SHARED_COPY_LIST"
   if [[ -s "$UNSHIMMED_FROM_SPARK_SHARED_COPY_LIST" ]]; then
-    echo "Promoting root-layout files from spark-shared via $unshimmed_patterns_txt"
+    echo "Promoting root-layout files from spark-shared by default"
     rsync --files-from="$UNSHIMMED_FROM_SPARK_SHARED_COPY_LIST" \
       ./parallel-world/spark-shared ./parallel-world
   fi
@@ -141,9 +275,23 @@ rm -rf "$SPARK_SHARED_DIR"
 mkdir -p "$SPARK_SHARED_DIR"
 
 echo "$((++STEP))/ retaining a single copy of spark-shared classes"
-while read -r spark_common_class; do
-  retain_single_copy "$spark_common_class"
-done < "$SPARK_SHARED_TXT"
+awk -F/ "
+  NF >= 3 {
+    shim = \$2
+    package_class = \$0
+    sub(\"^/spark[34][^/]*/\", \"\", package_class)
+    print package_class >> (\"from-\" shim \"-to-spark-shared.txt\")
+  }
+" "$SPARK_SHARED_TXT"
+for pw in ./parallel-world/spark[34]* ; do
+  awk -v pw="$pw" "
+    {
+      package_class = \$0
+      sub(\"^/spark[34][^/]*/\", \"\", package_class)
+      print pw \"/\" package_class
+    }
+  " "$SPARK_SHARED_TXT"
+done >> "$DELETE_DUPLICATES_TXT"
 
 echo "$((++STEP))/ rsyncing common classes to $SPARK_SHARED_DIR"
 for copy_list in from-spark[34]*-to-spark-shared.txt; do
@@ -157,7 +305,7 @@ done
 
 mv "$SPARK_SHARED_DIR" parallel-world/
 
-echo "$((++STEP))/ promoting allowlisted spark-shared files to root layout"
+echo "$((++STEP))/ promoting default spark-shared files to root layout"
 copy_unshimmed_from_spark_shared
 
 # Verify that all class files in the conventional jar location are bitwise
@@ -184,11 +332,16 @@ copy_unshimmed_from_spark_shared
 
 # Determine the list of unshimmed class files
 UNSHIMMED_LIST_TXT=unshimmed-result.txt
-echo "$((++STEP))/ creating sorted list of unshimmed classes > $UNSHIMMED_LIST_TXT"
-find ./parallel-world -name '*.class' -not -path './parallel-world/spark[34-]*' | \
+echo "$((++STEP))/ creating sorted list of root-layout unshimmed classes > $UNSHIMMED_LIST_TXT"
+find ./parallel-world -name '*.class' \
+  -not -path './parallel-world/spark[34-]*' \
+  -not -path './parallel-world/spark-shared/*' | \
   cut -d/ -f 3- | sort > "$UNSHIMMED_LIST_TXT"
 
-function verify_same_sha_for_unshimmed() {
+echo "$((++STEP))/ creating sorted list of spark-shared classes > $SPARK_SHARED_CLASSES_TXT"
+sed -E "s|^/spark[^/]*/||" "$SPARK_SHARED_TXT" | sort -u > "$SPARK_SHARED_CLASSES_TXT"
+
+function unshimmed_class_needs_shared_identity() {
   set -e
   class_file="$1"
 
@@ -196,7 +349,7 @@ function verify_same_sha_for_unshimmed() {
   # including the ones that are unshimmed. Instead of expensively recomputing
   # sha1 look up if there is an entry with the unshimmed class as a suffix
 
-  class_file_quoted=$(printf '%q' "$class_file")
+  class_file_quoted=$(printf "%q" "$class_file")
   # TODO currently RapidsShuffleManager is "removed" from /spark* by construction in
   # dist pom.xml via ant. We could delegate this logic to this script
   # and make both simmpler
@@ -211,34 +364,72 @@ function verify_same_sha_for_unshimmed() {
   # the class provides concrete implementations for ALL getReader variants,
   # so the JVM resolves the correct one at runtime regardless of which
   # ShuffleManager version the class was compiled against.
-  if [[ ! "$class_file_quoted" =~ com/nvidia/spark/rapids/spark[34].*/.*ShuffleManager.class && \
-          "$class_file_quoted" != "com/nvidia/spark/ParquetCachedBatchSerializer.class" && \
-          ! "$class_file_quoted" =~ org/apache/spark/sql/rapids/ProxyRapidsShuffleInternalManagerBase ]]; then
-      if ! grep -q "/spark.\+/$class_file_quoted" "$SPARK_SHARED_TXT"; then
-        echo >&2 "$class_file is not bitwise-identical across shims"
-        exit 255
-      fi
+  # GpuShuffleDependency has identical JVM bytecode and descriptors between
+  # Spark 3.5 and 4.1. Only ScalaSignature metadata differs after compiling
+  # the same source against different Spark dependency jars. WindowInPandasExecTypeShim
+  # has no methods in the class shell; its companion carries the behavior.
+  # CloseableColumnBatchIterator has identical descriptors and code; Scala 2.13 only
+  # renames generic Signature-attribute type variables across the Spark 3.5/4.1 compiles.
+  # GpuReadCSVFileFormat and GpuReadJsonFileFormat have identical descriptors and
+  # executable javap output; only ScalaSignature metadata differs across Spark deps.
+  # PythonMapInArrowExecShims and PythonArgumentUtils class shells have identical
+  # executable bytecode; only source-file metadata differs across shim source names.
+  # GpuUnionExecShim and RapidsErrorUtils class shells have identical executable
+  # bytecode; only ScalaSignature metadata differs.
+  # GpuStringTrim* differs after Spark 4.1 because String2TrimExpression adds
+  # collation/context-independent foldability methods. The case-class fields,
+  # product surface, and Spark 3.5-callable methods remain compatible; Spark 3.x
+  # does not invoke the added methods.
+  # GpuAtomicCreateTableAsSelectExec companion has identical executable bytecode;
+  # only line-number debug metadata differs across shim sources.
+  if [[ "$class_file_quoted" =~ com/nvidia/spark/rapids/spark[34].*/.*ShuffleManager.class || \
+          "$class_file_quoted" == "com/nvidia/spark/ParquetCachedBatchSerializer.class" || \
+          "$class_file_quoted" =~ org/apache/spark/sql/rapids/ProxyRapidsShuffleInternalManagerBase || \
+          "$class_file_quoted" == "org/apache/spark/sql/rapids/GpuShuffleDependency.class" || \
+          "$class_file_quoted" == "com/nvidia/spark/rapids/parquet/CloseableColumnBatchIterator.class" || \
+          "$class_file_quoted" == "com/nvidia/spark/rapids/GpuReadCSVFileFormat.class" || \
+          "$class_file_quoted" == "org/apache/spark/sql/catalyst/json/rapids/GpuReadJsonFileFormat.class" || \
+          "$class_file_quoted" == "com/nvidia/spark/rapids/shims/PythonMapInArrowExecShims.class" || \
+          "$class_file_quoted" == "org/apache/spark/sql/rapids/execution/python/shims/PythonArgumentUtils.class" || \
+          "$class_file_quoted" == "com/nvidia/spark/rapids/shims/GpuUnionExecShim.class" || \
+          "$class_file_quoted" == "org/apache/spark/sql/rapids/GpuStringTrim.class" || \
+          "$class_file_quoted" == "org/apache/spark/sql/rapids/GpuStringTrimLeft.class" || \
+          "$class_file_quoted" == "org/apache/spark/sql/rapids/GpuStringTrimRight.class" || \
+          "$class_file" == "org/apache/spark/sql/execution/datasources/v2/rapids/GpuAtomicCreateTableAsSelectExec$.class" || \
+          "$class_file_quoted" == "org/apache/spark/sql/rapids/shims/RapidsErrorUtils.class" || \
+          "$class_file_quoted" == "org/apache/spark/sql/rapids/execution/python/shims/WindowInPandasExecTypeShim.class" ]]; then
+      return 1
   fi
+  return 0
 }
 
-echo "$((++STEP))/ verifying unshimmed classes have unique sha1 across shims"
+echo "$((++STEP))/ filtering unshimmed classes that require shared identity > $UNSHIMMED_NEED_SHARED_TXT"
 while read -r unshimmed_class; do
-  verify_same_sha_for_unshimmed "$unshimmed_class"
-done < "$UNSHIMMED_LIST_TXT"
+  if unshimmed_class_needs_shared_identity "$unshimmed_class"; then
+    echo "$unshimmed_class"
+  fi
+done < "$UNSHIMMED_LIST_TXT" | sort -u > "$UNSHIMMED_NEED_SHARED_TXT"
+
+echo "$((++STEP))/ verifying unshimmed classes have unique sha1 across shims"
+comm -23 "$UNSHIMMED_NEED_SHARED_TXT" "$SPARK_SHARED_CLASSES_TXT" > "$UNSHIMMED_MISSING_SHARED_TXT"
+if [[ -s "$UNSHIMMED_MISSING_SHARED_TXT" ]]; then
+  read -r missing_unshimmed_class < "$UNSHIMMED_MISSING_SHARED_TXT"
+  echo >&2 "$missing_unshimmed_class is not bitwise-identical across shims"
+  exit 255
+fi
 
 # Remove unshimmed classes from parallel worlds
 # TODO rework with low priority, only a few classes.
 echo "$((++STEP))/ removing duplicates of unshimmed classes"
-
-while read -r unshimmed_class; do
+{
+  sed "s|^|./parallel-world/spark-shared/|" "$UNSHIMMED_LIST_TXT"
   for pw in ./parallel-world/spark[34-]* ; do
-    unshimmed_path="$pw/$unshimmed_class"
-    [[ -f "$unshimmed_path" ]] && echo "$unshimmed_path" || true
-  done >> "$DELETE_DUPLICATES_TXT"
-done < "$UNSHIMMED_LIST_TXT"
+    awk -v pw="$pw" "{ print pw \"/\" \$0 }" "$UNSHIMMED_LIST_TXT"
+  done
+} >> "$DELETE_DUPLICATES_TXT"
 
 echo "$((++STEP))/ deleting all class files listed in $DELETE_DUPLICATES_TXT"
-< "$DELETE_DUPLICATES_TXT" sort -u | xargs rm
+< "$DELETE_DUPLICATES_TXT" sort -u | xargs rm -f
 
 end_time=$(date +%s)
 echo "binary-dedupe completed in $((end_time - start_time)) seconds"
diff --git a/dist/scripts/build-unshim-parallel-world.py b/dist/scripts/build-unshim-parallel-world.py
new file mode 100644
index 00000000000..9f41be63558
--- /dev/null
+++ b/dist/scripts/build-unshim-parallel-world.py
@@ -0,0 +1,292 @@
+#!/usr/bin/env python3
+
+# Copyright (c) 2026, NVIDIA CORPORATION.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+"""Build dist/target/parallel-world directly for repeated unshim analysis.
+
+This mirrors the analyzer-relevant part of dist/maven-antrun/build-parallel-worlds.xml
+without starting a final Maven dist generate-resources invocation. It assumes buildall has
+already built the per-shim sql-plugin-api and aggregator jars under <module>/target/spark<buildver>.
+"""
+
+import argparse
+import fnmatch
+import hashlib
+import os
+from pathlib import Path
+import shutil
+import subprocess
+import sys
+import zipfile
+
+
+ARTIFACTS = ("sql-plugin-api", "aggregator")
+
+
+def read_patterns(path):
+    """Return the non-blank, non-comment ('#') lines of path, stripped of whitespace."""
+    with path.open() as handle:
+        stripped = (raw.strip() for raw in handle)
+        # Materialize inside the with-block: the generator reads from the open file.
+        kept = [entry for entry in stripped if entry and not entry.startswith("#")]
+    return kept
+
+
+def has_fnmatch_magic(pattern):
+    return not set("*?[").isdisjoint(pattern)  # True when any glob metacharacter occurs
+
+
+def matching_members(namelist, patterns):
+    """Return namelist entries selected by patterns: fnmatch for globs, exact otherwise."""
+    occurrences = {}
+    for entry in namelist:
+        occurrences[entry] = occurrences.get(entry, 0) + 1
+    selected = []
+    for pattern in patterns:
+        if has_fnmatch_magic(pattern):
+            selected += fnmatch.filter(namelist, pattern)
+        else:
+            selected += [pattern] * occurrences.get(pattern, 0)
+    return selected
+
+
+def safe_extract(zip_handle, destination, members=None):
+    # Refuse any entry whose resolved path would land outside destination.
+    root = destination.resolve()
+    for entry in zip_handle.namelist() if members is None else members:
+        if not str((root / entry).resolve()).startswith(str(root) + os.sep):
+            raise RuntimeError("refusing to extract outside destination: %s" % entry)
+        zip_handle.extract(entry, root)
+
+
+def clean_output(target_dir):
+    """Empty the generated output directories and delete jars directly in target_dir."""
+    for output_dir in map(target_dir.joinpath, ("parallel-world", "deps", "extra-resources")):
+        if output_dir.exists():
+            shutil.rmtree(output_dir)
+        output_dir.mkdir(parents=True, exist_ok=True)
+    for stale_jar in target_dir.glob("*.jar"):
+        stale_jar.unlink()
+
+
+def artifact_jar(base_dir, artifact, scala_binary_version, project_version, buildver):
+    """Return <base_dir>/<artifact>/target/spark<buildver>/<jar>; raise if it is not built."""
+    shim = "spark%s" % buildver
+    file_name = "rapids-4-spark-%s_%s-%s-%s.jar" % (
+        artifact, scala_binary_version, project_version, shim)
+    candidate = base_dir.joinpath(artifact, "target", shim, file_name)
+    if candidate.is_file():
+        return candidate
+    raise FileNotFoundError("expected built %s jar missing: %s" % (artifact, candidate))
+
+
+def jar_signature(jar_path):
+    """Describe a jar by path, size and mtime; any change to those alters the text."""
+    info = jar_path.stat()
+    fields = (
+        ("path", jar_path),
+        ("size", info.st_size),
+        ("mtime_ns", info.st_mtime_ns))
+    return "".join("%s=%s\n" % field for field in fields)
+
+
+def dedupe_cache_key(base_dir, scala_binary_version, project_version, buildvers):
+    """Hash the signatures of all input jars into a hex key for the dedupe cache."""
+    digest_input = []
+    for buildver in sorted(buildvers, reverse=True):
+        for artifact in ARTIFACTS:
+            built_jar = artifact_jar(
+                base_dir, artifact, scala_binary_version, project_version, buildver)
+            digest_input.append("buildver=%s" % buildver)
+            digest_input.append("artifact=%s" % artifact)
+            digest_input.append(jar_signature(built_jar))
+    joined = "\n".join(digest_input)
+    return hashlib.sha1(joined.encode("utf-8")).hexdigest()
+
+
+def ensure_extracted_cache(jar_path, cache_dir):
+    """Return cache_dir/contents holding jar_path's entries, re-extracting if stale."""
+    extracted = cache_dir / "contents"
+    stamp = cache_dir / ".source"
+    expected = jar_signature(jar_path)
+    cache_is_fresh = stamp.is_file() and stamp.read_text() == expected
+    if not cache_is_fresh:
+        if cache_dir.exists():
+            shutil.rmtree(cache_dir)
+        extracted.mkdir(parents=True, exist_ok=True)
+        with zipfile.ZipFile(jar_path) as archive:
+            safe_extract(archive, extracted)
+        # Written last so an interrupted extraction is never mistaken for a full one.
+        stamp.write_text(expected)
+    return extracted
+
+
+def link_or_copy(src, dst):
+    dst.parent.mkdir(parents=True, exist_ok=True)
+    if dst.exists() or dst.is_symlink():  # exists() is False for a dangling symlink
+        dst.unlink()
+    try:
+        os.link(src, dst)  # hard link: dst becomes another name for src's data
+    except OSError:
+        shutil.copy2(src, dst)  # linking failed: fall back to a copy of src
+
+
+def link_tree_contents(src_dir, dst_dir):
+    """Mirror src_dir's directories under dst_dir and link (or copy) every file."""
+    for walked, _subdirs, file_names in os.walk(src_dir):
+        here = Path(walked)
+        mirror = dst_dir.joinpath(here.relative_to(src_dir))
+        mirror.mkdir(parents=True, exist_ok=True)
+        for file_name in file_names:
+            link_or_copy(here / file_name, mirror / file_name)
+
+
+def link_members(contents_dir, destination, members):
+    """Link each listed archive member that was extracted as a regular file."""
+    for entry in members:
+        # Names ending in "/" are skipped without touching the filesystem.
+        extracted = None if entry.endswith("/") else contents_dir / entry
+        if extracted is not None and extracted.is_file():
+            link_or_copy(extracted, destination / entry)
+
+
+def copy_and_extract_jars(
+        base_dir,
+        target_dir,
+        scala_binary_version,
+        project_version,
+        buildvers,
+        from_single_shim,
+        from_each):
+    """Populate target_dir/parallel-world from every shim's built jars.
+
+    Each jar's files are linked under parallel-world/spark<buildver>. Entries matching
+    from_each are also linked at the parallel-world root; the highest buildver (string
+    order) additionally contributes from_single_shim matches and its sql-plugin-api files.
+    """
+    world = target_dir / "parallel-world"
+    cache_root = target_dir / "unshim-parallel-world-cache"
+    ordered = sorted(buildvers, reverse=True)
+    root_buildver = ordered[0]
+    for buildver in ordered:
+        shim = "spark%s" % buildver
+        is_root_shim = buildver == root_buildver
+        patterns = from_single_shim + from_each if is_root_shim else from_each
+        for artifact in ARTIFACTS:
+            jar = artifact_jar(
+                base_dir, artifact, scala_binary_version, project_version, buildver)
+            contents = ensure_extracted_cache(jar, cache_root / shim / artifact)
+            with zipfile.ZipFile(jar) as archive:
+                entries = archive.namelist()
+            link_tree_contents(contents, world / shim)
+            if is_root_shim and artifact == "sql-plugin-api":
+                link_tree_contents(contents, world)
+            link_members(contents, world, matching_members(entries, patterns))
+
+
+def run_checked(command, cwd, env=None):
+    subprocess.check_call(command, cwd=str(cwd), env=env)  # raises CalledProcessError on failure
+
+
+def remove_allowlisted_from_spark_shared(parallel_world, from_single_shim):
+    """Delete files under parallel_world/spark-shared that match from_single_shim."""
+    shared = parallel_world / "spark-shared"
+    if not shared.is_dir():
+        return
+    for pattern in from_single_shim:
+        if not has_fnmatch_magic(pattern):
+            candidates = [shared / pattern]
+        else:
+            candidates = [found for found in shared.rglob("*")
+                          if fnmatch.fnmatch(found.relative_to(shared).as_posix(), pattern)]
+        for candidate in candidates:
+            if candidate.is_file():
+                candidate.unlink()
+
+
+def main():
+    """Assemble <mvn-base-dir>/dist/target/parallel-world and run binary-dedupe on it.
+
+    Steps: parse arguments, reset the output directories, lay out every shim's
+    jars, run check-shims-revisions.sh, run binary-dedupe.sh, and finally drop the
+    single-shim allowlisted files from spark-shared.
+    """
+    parser = argparse.ArgumentParser(description=__doc__)
+    parser.add_argument("--mvn-base-dir", required=True,
+        help="Maven build root containing module target directories")
+    parser.add_argument("--source-dir", required=True,
+        help="Top-level spark-rapids source directory")
+    parser.add_argument("--project-version", required=True)
+    parser.add_argument("--scala-binary-version", required=True)
+    parser.add_argument("--buildvers", required=True,
+        help="Comma-separated Spark build versions, for example 350,411")
+    parser.add_argument("--ignore-shim-revisions-check", action="store_true",
+        help="Continue when per-shim build metadata revisions differ")
+    args = parser.parse_args()
+
+    base_dir = Path(args.mvn_base_dir).resolve()
+    dist_dir = Path(args.source_dir).resolve() / "dist"
+    scripts_dir = dist_dir / "scripts"
+    target_dir = base_dir / "dist" / "target"
+    parallel_world = target_dir / "parallel-world"
+    single_shim_txt = dist_dir / "unshimmed-common-from-single-shim.txt"
+
+    # Tolerate stray commas and whitespace in --buildvers.
+    buildvers = [token.strip() for token in args.buildvers.split(",") if token.strip()]
+    if not buildvers:
+        raise RuntimeError("no build versions were supplied")
+
+    from_single_shim = read_patterns(single_shim_txt)
+    from_each = read_patterns(dist_dir / "unshimmed-from-each-spark3xx.txt")
+
+    print("Direct unshim parallel-world assembly for Spark versions: %s" %
+          ", ".join(buildvers), flush=True)
+    clean_output(target_dir)
+    copy_and_extract_jars(
+        base_dir, target_dir, args.scala_binary_version, args.project_version,
+        buildvers, from_single_shim, from_each)
+
+    # Run unchecked so a failure can be downgraded to a message when
+    # --ignore-shim-revisions-check was given.
+    revision_check = subprocess.run(
+        [str(scripts_dir / "check-shims-revisions.sh"), ",".join(buildvers)],
+        cwd=str(target_dir),
+        check=False)
+    check_failed = revision_check.returncode != 0
+    if check_failed and not args.ignore_shim_revisions_check:
+        revision_check.check_returncode()
+    elif check_failed:
+        print("Ignoring shim revision check failure for direct unshim parallel-world assembly",
+              flush=True)
+
+    cache_key = dedupe_cache_key(
+        base_dir, args.scala_binary_version, args.project_version, buildvers)
+    # Settings handed to binary-dedupe.sh through its environment.
+    dedupe_env = dict(
+        os.environ,
+        UNSHIM_FAST="1",
+        UNSHIM_DEDUPE_CACHE_DIR=str(target_dir / "unshim-dedupe-cache" / cache_key),
+        UNSHIMMED_COMMON_FROM_SINGLE_SHIM_TXT=str(single_shim_txt),
+        KEEP_IN_SPARK_SHARED_TXT=str(dist_dir / "keep-in-spark-shared.txt"),
+        UNSHIM_ANALYZER_SCRIPT=str(scripts_dir / "analyze-parallel-world-deps.py"))
+    run_checked(
+        [str(scripts_dir / "binary-dedupe.sh")], cwd=target_dir, env=dedupe_env)
+    remove_allowlisted_from_spark_shared(parallel_world, from_single_shim)
+
+    print("Direct unshim parallel-world output: %s" % parallel_world, flush=True)
+
+
+if __name__ == "__main__":
+    sys.exit(main())
diff --git a/dist/unshimmed-common-from-single-shim.txt b/dist/unshimmed-common-from-single-shim.txt
index 5802807a250..a3dc3ed0214 100644
--- a/dist/unshimmed-common-from-single-shim.txt
+++ b/dist/unshimmed-common-from-single-shim.txt
@@ -1,53 +1,9 @@
+# Files that must be promoted to the root layout from one representative shim
+# but are not selected by default class promotion. Common class files are
+# unshimmed by default when binary-dedupe proves they are bitwise-identical
+# across shims.
 META-INF/DEPENDENCIES
 META-INF/LICENSE
 META-INF/NOTICE
-com/nvidia/spark/rapids/ExplainPlan.class
-com/nvidia/spark/rapids/ExplainPlan$.class
-com/nvidia/spark/rapids/ExplainPlanBase.class
-com/nvidia/spark/rapids/Optimizer.class
-com/nvidia/spark/rapids/optimizer/SQLOptimizerPlugin*
-com/nvidia/spark/rapids/ShimLoaderTemp*
-com/nvidia/spark/rapids/SparkShims*
-com/nvidia/spark/rapids/fileio/iceberg/IcebergInputFile.class
-com/nvidia/spark/rapids/fileio/iceberg/IcebergInputStream.class
-com/nvidia/spark/rapids/fileio/iceberg/IcebergOutputFile.class
-com/nvidia/spark/rapids/fileio/iceberg/IcebergOutputStream.class
-com/nvidia/spark/rapids/iceberg/GpuInternalRow.class
-com/nvidia/spark/rapids/iceberg/GpuInternalRowBase.class
-com/nvidia/spark/rapids/iceberg/data/GpuDeleteFilter2.class
-com/nvidia/spark/rapids/iceberg/package.class
-com/nvidia/spark/rapids/iceberg/package$.class
-com/nvidia/spark/rapids/iceberg/parquet/FileSchemaAccessors.class
-com/nvidia/spark/rapids/iceberg/parquet/GpuIcebergParquetReader$.class
-com/nvidia/spark/rapids/iceberg/parquet/SingleFile.class
-com/nvidia/spark/rapids/iceberg/parquet/SingleFile$.class
-com/nvidia/spark/rapids/iceberg/parquet/ThreadConf.class
-com/nvidia/spark/rapids/iceberg/spark/GpuSparkReadOptions.class
-com/nvidia/spark/rapids/iceberg/spark/GpuSparkReadOptions$.class
-com/nvidia/spark/rapids/iceberg/spark/GpuSparkSQLProperties.class
-com/nvidia/spark/rapids/iceberg/spark/GpuSparkSQLProperties$.class
-com/nvidia/spark/rapids/iceberg/spark/GpuSparkUtil.class
-com/nvidia/spark/rapids/iceberg/spark/GpuSparkUtil$.class
-com/nvidia/spark/rapids/iceberg/spark/RapidsSparkCatalog.class
-com/nvidia/spark/rapids/iceberg/spark/RapidsSparkSessionCatalog.class
-com/nvidia/spark/rapids/iceberg/spark/source/RapidsSparkTable.class
-org/apache/iceberg/aws/s3/IcebergS3InputFileAccess.class
-org/apache/iceberg/data/GpuFileHelpers.class
-org/apache/iceberg/io/GpuClusteredWriterBridge.class
-org/apache/iceberg/io/GpuFanoutWriterBridge.class
-org/apache/iceberg/io/GpuPositionDeleteFileWriter$.class
-org/apache/iceberg/parquet/GpuParquetIOAccess.class
-org/apache/iceberg/spark/GpuTypeToSparkType.class
-org/apache/iceberg/spark/GpuTypeToSparkType$.class
-org/apache/iceberg/spark/GpuSparkReadConf.class
-org/apache/iceberg/spark/GpuSparkReadConfAccess.class
-org/apache/iceberg/spark/package.class
-org/apache/iceberg/spark/package$.class
-org/apache/iceberg/spark/source/GpuBaseReader.class
-org/apache/iceberg/spark/source/GpuSparkPlanningUtil.class
-org/apache/iceberg/spark/source/GpuSparkScanAccess.class
-org/apache/iceberg/spark/source/GpuSparkWriteAccess.class
-org/apache/iceberg/spark/source/GpuStructInternalRow.class
-org/apache/spark/sql/rapids/AdaptiveSparkPlanHelperShim*
-org/apache/spark/sql/rapids/ExecutionPlanCaptureCallback*
+rapids4spark-private-version-info.properties
 rapids/*.py
diff --git a/dist/unshimmed-from-each-spark3xx.txt b/dist/unshimmed-from-each-spark3xx.txt
index 918a572722b..1f96d9d0781 100644
--- a/dist/unshimmed-from-each-spark3xx.txt
+++ b/dist/unshimmed-from-each-spark3xx.txt
@@ -9,4 +9,6 @@ com/nvidia/spark/rapids/delta/DeltaProbe.class
 com/nvidia/spark/rapids/delta/DeltaProvider.class
 com/nvidia/spark/rapids/delta/DeltaProvider$.class
 com/nvidia/spark/rapids/PlanShims*
+org/apache/spark/sql/rapids/GpuShuffleDependency.class
+org/apache/spark/sql/rapids/execution/python/shims/WindowInPandasExecTypeShim.class
 spark-*-info.properties
diff --git a/docs/additional-functionality/rapids-udfs.md b/docs/additional-functionality/rapids-udfs.md
index d498a841ef1..e4144460f0e 100644
--- a/docs/additional-functionality/rapids-udfs.md
+++ b/docs/additional-functionality/rapids-udfs.md
@@ -152,7 +152,7 @@ The GPU support for Pandas UDF is an experimental feature, and may change at any
 ---
 
 GPU support for Pandas UDF is built on Apache Spark's [Pandas UDF(user defined
-function)](https://archive.apache.org/dist/spark/docs/3.2.0/api/python/user_guide/sql/arrow_pandas.html#pandas-udfs-a-k-a-vectorized-udfs),
+function)](https://spark.apache.org/docs/3.5.7/api/python/user_guide/sql/arrow_pandas.html#pandas-udfs-a-k-a-vectorized-udfs),
 and has two features:
 
 - **GPU Assignment(Scheduling) in Python Process**: Let the Python process share the same GPU with
@@ -201,12 +201,12 @@ Accelerator has a 1-1 mapping support for each of them.
 
   |Spark Execution Plan|Data Transfer Accelerated|Use Case|
   |----------------------|----------|--------|
-  |ArrowEvalPythonExec|yes|[Series to Series](https://archive.apache.org/dist/spark/docs/3.2.0/api/python/user_guide/sql/arrow_pandas.html#series-to-series), [Iterator of Series to Iterator of Series](https://archive.apache.org/dist/spark/docs/3.2.0/api/python/user_guide/sql/arrow_pandas.html#iterator-of-series-to-iterator-of-series) and [Iterator of Multiple Series to Iterator of Series](https://archive.apache.org/dist/spark/docs/3.2.0/api/python/user_guide/sql/arrow_pandas.html#iterator-of-multiple-series-to-iterator-of-series)|
-  |MapInPandasExec|yes|[Map](https://archive.apache.org/dist/spark/docs/3.2.0/api/python/user_guide/sql/arrow_pandas.html#map)|
-  |WindowInPandasExec|yes|[Window](https://archive.apache.org/dist/spark/docs/3.2.0/api/python/user_guide/sql/arrow_pandas.html#series-to-scalar)|
-  |FlatMapGroupsInPandasExec|yes|[Grouped Map](https://archive.apache.org/dist/spark/docs/3.2.0/api/python/user_guide/sql/arrow_pandas.html#grouped-map)|
-  |AggregateInPandasExec|yes|[Aggregate](https://archive.apache.org/dist/spark/docs/3.2.0/api/python/user_guide/sql/arrow_pandas.html#series-to-scalar)|
-  |FlatMapCoGroupsInPandasExec|yes|[Co-grouped Map](https://archive.apache.org/dist/spark/docs/3.2.0/api/python/user_guide/sql/arrow_pandas.html#co-grouped-map)|
+  |ArrowEvalPythonExec|yes|[Series to Series](https://spark.apache.org/docs/3.5.7/api/python/user_guide/sql/arrow_pandas.html#series-to-series), [Iterator of Series to Iterator of Series](https://spark.apache.org/docs/3.5.7/api/python/user_guide/sql/arrow_pandas.html#iterator-of-series-to-iterator-of-series) and [Iterator of Multiple Series to Iterator of Series](https://spark.apache.org/docs/3.5.7/api/python/user_guide/sql/arrow_pandas.html#iterator-of-multiple-series-to-iterator-of-series)|
+  |MapInPandasExec|yes|[Map](https://spark.apache.org/docs/3.5.7/api/python/user_guide/sql/arrow_pandas.html#map)|
+  |WindowInPandasExec|yes|[Window](https://spark.apache.org/docs/3.5.7/api/python/user_guide/sql/arrow_pandas.html#series-to-scalar)|
+  |FlatMapGroupsInPandasExec|yes|[Grouped Map](https://spark.apache.org/docs/3.5.7/api/python/user_guide/sql/arrow_pandas.html#grouped-map)|
+  |AggregateInPandasExec|yes|[Aggregate](https://spark.apache.org/docs/3.5.7/api/python/user_guide/sql/arrow_pandas.html#series-to-scalar)|
+  |FlatMapCoGroupsInPandasExec|yes|[Co-grouped Map](https://spark.apache.org/docs/3.5.7/api/python/user_guide/sql/arrow_pandas.html#co-grouped-map)|
 
 
 ### Other Configuration
diff --git a/docs/dev/adaptive-query.md b/docs/dev/adaptive-query.md
index c3e5568bfb4..cf9c8c126e4 100644
--- a/docs/dev/adaptive-query.md
+++ b/docs/dev/adaptive-query.md
@@ -51,7 +51,7 @@ optimizer rules:
 
 ```scala
 extensions.injectColumnar(_ => ColumnarOverrideRules())
-extensions.injectQueryStagePrepRule(_ => GpuQueryStagePrepOverrides())
+extensions.injectQueryStagePrepRule(_ => new GpuQueryStagePrepOverrides)
 ```
 
 The `ColumnarOverrideRules` are used whether AQE is enabled or not, and the
diff --git a/docs/dev/shimplify.md b/docs/dev/shimplify.md
index 4fefd824c7c..dd1f83f871d 100644
--- a/docs/dev/shimplify.md
+++ b/docs/dev/shimplify.md
@@ -266,4 +266,4 @@ See [CPD user doc][7] for more details about the options you can pass inside `cp
 [4]: https://jsonlines.org/
 [5]: https://spark.apache.org/versioning-policy.html
 [6]: https://plugins.jetbrains.com/plugin/16429-idea-resolve-symlinks
-[7]: https://docs.pmd-code.org/latest/pmd_userdocs_cpd.html
+[7]: https://pmd.github.io/pmd/pmd_userdocs_cpd.html
diff --git a/docs/dev/shims.md b/docs/dev/shims.md
index 38a368df73b..f68b5e61e81 100644
--- a/docs/dev/shims.md
+++ b/docs/dev/shims.md
@@ -22,6 +22,100 @@ class as a tight entry point for interacting with the host Spark runtime.
 
 In the following we provide recipes for typical scenarios addressed by the Shim layer.
 
+## One-way Shim Module Boundary
+
+Shim source can be split across three layers when the implementation does not have to live
+in the same module as the Spark-version-specific API reference.
+
+1. `sql-plugin-api` contains the narrow shared types that both sides can see. These types must
+   not depend on `sql-plugin` implementation classes.
+2. `sql-plugin-shims` depends on `sql-plugin-api` and Spark. It may reference Spark classes whose
+   source or binary shape varies by build version, but it must not reference implementation types
+   such as `GpuOverrides`, `RapidsMeta`, `ExprRule`, `ExecRule`, or GPU meta classes.
+3. `sql-plugin` depends on `sql-plugin-shims`. It turns API-level shim descriptors into concrete
+   plugin rules and owns the RAPIDS metadata factories.
+
+For replacement rules, use descriptor objects when the shim only needs to identify a Spark class
+and provide stable rule metadata. For example, `ShimDataWritingCommandRule`,
+`ShimRunnableCommandRule`, and `ShimExecRule` live in `sql-plugin-api`; versioned objects in
+`sql-plugin-shims` instantiate those descriptors with Spark-specific class tags; `sql-plugin`
+then calls the corresponding `GpuOverrides.*FromShim` method and supplies the actual `RapidsMeta`
+factory. This keeps the call direction one-way: shared plugin code can consume shim descriptors,
+while shim code cannot call back into shared plugin implementation.
+
+Classes whose `spark-rapids-shim-json-lines` entries cover all build versions can be unshimmed
+into a common source root when there is no special-version sibling and the source is truly
+compatible across the supported Spark APIs. When a file has Databricks-specific, Spark 4.1-specific,
+or otherwise divergent siblings, keep the version-specific source and move only the API-safe part
+behind the one-way boundary.
+
+## Reducing Parallel-World Classes
+
+The long-term goal is to maximize bytecode in the conventional jar layout and shrink the amount
+of code that must be loaded through the parallel-world mechanism. A class can move from
+`spark-shared` to the conventional layout only when it has no static dependency path to
+Spark-version-specific bytecode. The dependency path matters transitively: a `spark-shared` class
+that calls another `spark-shared` class that eventually calls a `sparkXYZ` class is not root-safe.
+
+`dist/unshimmed-common-from-single-shim.txt` names classes and resources that are allowed to be
+stored in the conventional layout after the dist jar is assembled. During `binary-dedupe.sh`, files
+from that allowlist may be promoted out of `spark-shared` into the root layout before the bitwise
+identity check runs. This is important for profiles where the highest Spark build contributes only a
+stub module, while a lower Spark build contributes the real implementation. For example, root-safe
+Iceberg helpers can still be placed in the conventional layout even when the Spark 4.1 shim uses the
+Iceberg stub.
+
+Use a small bootstrap allowlist for classes that are allowed to refer to packages generated with
+`$_spark.version.classifier_`, such as `com.nvidia.spark.rapids.spark330.RapidsShuffleManager`.
+Ordinary shared implementation classes should not have direct static dependencies on those
+classifier packages. They should instead call through stable contracts in `sql-plugin-api` or
+through descriptor objects in `sql-plugin-shims`.
+
+For an inventory of a released artifact, download the complete dist jar from Maven Central and run
+the dependency analyzer directly against the jar:
+
+```bash
+VERSION=26.04.2
+curl -fL -o /tmp/rapids-4-spark_2.12-${VERSION}-cuda12.jar \
+  https://repo.maven.apache.org/maven2/com/nvidia/rapids-4-spark_2.12/${VERSION}/rapids-4-spark_2.12-${VERSION}-cuda12.jar
+
+python3 dist/scripts/analyze-parallel-world-deps.py \
+  /tmp/rapids-4-spark_2.12-${VERSION}-cuda12.jar \
+  --show-topo
+```
+
+Run the same command for the Scala 2.13 artifact when checking Spark 4.x coverage. Internal
+snapshot artifacts can be analyzed the same way after downloading a timestamped dist jar from the
+configured artifact repository; keep repository credentials in local Maven or environment
+configuration rather than embedding them in scripts or docs.
+
+For local branch validation, build representative two-shim dist jars that span the widest
+differences in each Scala line:
+
+```bash
+./build/buildall --profile=350,411 --scala213 --module=dist
+python3 dist/scripts/analyze-parallel-world-deps.py \
+  scala2.13/dist/target/parallel-world \
+  --show-topo
+
+./build/buildall --profile=330,358 --module=dist
+python3 dist/scripts/analyze-parallel-world-deps.py \
+  dist/target/parallel-world \
+  --show-topo
+```
+
+The analyzer reports:
+
+1. direct classifier-package dependencies, which should remain limited to bootstrap/facade code;
+2. root or `spark-shared` classes with transitive paths to version-specific classes;
+3. root-safe `spark-shared` strongly connected components in dependency-first order.
+
+Use `--format=json` when comparing safe components across artifacts or build outputs. JSON output
+keeps counts exact and bounds example sections with `--limit`.
+Shortest paths explain why a class is blocked and usually identify the adapter boundary to cut.
+Strongly connected components, not shortest paths, provide the migration ordering because classes in
+the same component have to move or be refactored together.
+
 ## Method signature discrepancies
 
 It's among the easiest issues to resolve. We define a method in SparkShims
diff --git a/iceberg/common/src/main/java/org/apache/iceberg/spark/source/GpuSparkWriteAccess.java b/iceberg/common/src/main/java/org/apache/iceberg/spark/source/GpuSparkWriteAccess.java
index 91ed87280da..8e3f7b55a51 100644
--- a/iceberg/common/src/main/java/org/apache/iceberg/spark/source/GpuSparkWriteAccess.java
+++ b/iceberg/common/src/main/java/org/apache/iceberg/spark/source/GpuSparkWriteAccess.java
@@ -17,11 +17,14 @@
 package org.apache.iceberg.spark.source;
 
 import java.lang.reflect.Field;
+import java.lang.reflect.InvocationTargetException;
+import java.lang.reflect.Method;
 import java.util.Map;
 
 import org.apache.iceberg.DataFile;
 import org.apache.iceberg.FileFormat;
 import org.apache.iceberg.Schema;
+import org.apache.iceberg.SnapshotUpdate;
 import org.apache.iceberg.Table;
 import org.apache.iceberg.deletes.DeleteGranularity;
 import org.apache.iceberg.io.DeleteWriteResult;
@@ -94,6 +97,23 @@ public static Map<String, String> writeProperties(Write write) {
     return readField(sparkWrite(write), "writeProperties", Map.class);
   }
 
+  public static void abort(Write write, WriterCommitMessage[] messages) {
+    invokeMethod(
+        sparkWrite(write),
+        "abort",
+        new Class<?>[] {WriterCommitMessage[].class},
+        new Object[] {messages});
+  }
+
+  public static void commitOperation(
+      Write write, SnapshotUpdate<?> operation, String description) {
+    invokeMethod(
+        sparkWrite(write),
+        "commitOperation",
+        new Class<?>[] {SnapshotUpdate.class, String.class},
+        new Object[] {operation, description});
+  }
+
   public static Table table(DeltaWrite write) {
     return readField(positionDeltaWrite(write), "table", Table.class);
   }
@@ -169,6 +189,10 @@ public static WriterCommitMessage taskCommit(DataFile[] files) {
     return commit;
   }
 
+  public static DataFile[] taskCommitFiles(WriterCommitMessage message) {
+    return ((SparkWrite.TaskCommit) message).files();
+  }
+
   public static WriterCommitMessage deltaTaskCommit(WriteResult result) {
     return new SparkPositionDeltaWrite.DeltaTaskCommit(result);
   }
@@ -208,4 +232,38 @@ private static Field findField(Class<?> targetClass, String fieldName) {
     throw new IllegalStateException("No field " + fieldName + " in " + targetClass.getName());
   }
 
+  private static void invokeMethod(
+      Object target, String methodName, Class<?>[] parameterTypes, Object[] args) {
+    final String failure =
+        "Unable to invoke " + methodName + " on " + target.getClass().getName();
+    try {
+      Method resolved = findMethod(target.getClass(), methodName, parameterTypes);
+      resolved.setAccessible(true);
+      resolved.invoke(target, args);
+    } catch (IllegalAccessException accessDenied) {
+      throw new IllegalStateException(failure, accessDenied);
+    } catch (InvocationTargetException wrapped) {
+      // Rethrow unchecked failures of the invoked method as-is; wrap anything else.
+      Throwable thrown = wrapped.getCause();
+      if (thrown instanceof RuntimeException) {
+        throw (RuntimeException) thrown;
+      } else if (thrown instanceof Error) {
+        throw (Error) thrown;
+      }
+      throw new IllegalStateException(failure, thrown);
+    }
+  }
+
+  private static Method findMethod(
+      Class<?> targetClass, String methodName, Class<?>[] parameterTypes) {
+    // Search the class itself first, then each superclass in turn.
+    for (Class<?> type = targetClass; type != null; type = type.getSuperclass()) {
+      try {
+        return type.getDeclaredMethod(methodName, parameterTypes);
+      } catch (NoSuchMethodException ignored) {
+        // Not declared at this level; continue with the superclass.
+      }
+    }
+    throw new IllegalStateException("No method " + methodName + " in " + targetClass.getName());
+  }
 }
diff --git a/iceberg/common/src/main/scala/com/nvidia/spark/rapids/iceberg/GpuIcebergPartitioner.scala b/iceberg/common/src/main/scala/com/nvidia/spark/rapids/iceberg/GpuIcebergPartitioner.scala
index a93e77533ed..0887ea7281d 100644
--- a/iceberg/common/src/main/scala/com/nvidia/spark/rapids/iceberg/GpuIcebergPartitioner.scala
+++ b/iceberg/common/src/main/scala/com/nvidia/spark/rapids/iceberg/GpuIcebergPartitioner.scala
@@ -98,7 +98,7 @@ class GpuIcebergPartitioner(
 
           // Combine the partition keys and partitioned tables
           partitionKeys.zip(partitions).map { case (partKey, partition) =>
-            ColumnarBatchWithPartition(SpillableColumnarBatch(partition,
+            new ColumnarBatchWithPartition(SpillableColumnarBatch(partition,
               valueSparkType,
               SpillPriorities.ACTIVE_BATCHING_PRIORITY),
               partKey)
@@ -178,8 +178,9 @@ class GpuIcebergSpecPartitioner(val spec: PartitionSpec,
   }
 }
 
-case class ColumnarBatchWithPartition(batch: SpillableColumnarBatch, partition: StructLike) extends
-  AutoCloseable {
+class ColumnarBatchWithPartition(
+    val batch: SpillableColumnarBatch,
+    val partition: StructLike) extends AutoCloseable {
   override def close(): Unit = {
     batch.close()
   }
diff --git a/iceberg/common/src/main/scala/com/nvidia/spark/rapids/iceberg/parquet/GpuCoalescingIcebergParquetReader.scala b/iceberg/common/src/main/scala/com/nvidia/spark/rapids/iceberg/parquet/GpuCoalescingIcebergParquetReader.scala
index 56ab66a20ee..2df18a7d7fd 100644
--- a/iceberg/common/src/main/scala/com/nvidia/spark/rapids/iceberg/parquet/GpuCoalescingIcebergParquetReader.scala
+++ b/iceberg/common/src/main/scala/com/nvidia/spark/rapids/iceberg/parquet/GpuCoalescingIcebergParquetReader.scala
@@ -68,11 +68,11 @@ class GpuCoalescingIcebergParquetReader(
             conf.metrics)
 
           info.blocks.map { block =>
-            ParquetSingleDataBlockMeta(
+            new ParquetSingleDataBlockMeta(
               info.filePath,
-              ParquetDataBlock(block, CpuCompressionConfig.disabled()),
+              new ParquetDataBlock(block, CpuCompressionConfig.disabled()),
               InternalRow.empty,
-              ParquetSchemaWrapper(info.schema),
+              new ParquetSchemaWrapper(info.schema),
               info.readSchema,
               IcebergParquetExtraInfo(
                 info.dateRebaseMode,
diff --git a/iceberg/common/src/main/scala/org/apache/iceberg/spark/functions/transforms.scala b/iceberg/common/src/main/scala/org/apache/iceberg/spark/functions/transforms.scala
index 33b68811d79..f1674fc618a 100644
--- a/iceberg/common/src/main/scala/org/apache/iceberg/spark/functions/transforms.scala
+++ b/iceberg/common/src/main/scala/org/apache/iceberg/spark/functions/transforms.scala
@@ -98,7 +98,7 @@ object GpuTransform {
   }
 }
 
-case class GpuFieldTransform(sourceFieldId: Int, transform: GpuTransform) {
+class GpuFieldTransform(val sourceFieldId: Int, val transform: GpuTransform) {
   def supports(inputType: StructType, inputSchema: Schema): Boolean = {
     // Iceberg allows partition source fields to reference nested-leaf field ids
     // (e.g. `bucket(4, contact.email)`). Those ids do not appear in
diff --git a/iceberg/common/src/main/scala/org/apache/iceberg/spark/source/GpuReaderFactory.scala b/iceberg/common/src/main/scala/org/apache/iceberg/spark/source/GpuReaderFactory.scala
index 0efbee1da56..4e9b2a6ec6d 100644
--- a/iceberg/common/src/main/scala/org/apache/iceberg/spark/source/GpuReaderFactory.scala
+++ b/iceberg/common/src/main/scala/org/apache/iceberg/spark/source/GpuReaderFactory.scala
@@ -108,7 +108,7 @@ class GpuReaderFactory(private val metrics: Map[String, GpuMetric],
           queryUsesInputFile || hasFilePathMetadata || hasRowPositionMetadata ||
             !hasNoDeletes
         MultiThread(poolConfBuilder, partition.maxNumParquetFilesParallel,
-          CombineConf(combineThresholdSize, combineWaitTime),
+          new CombineConf(combineThresholdSize, combineWaitTime),
           disableCombining,
           hasFilePathMetadata,
           hasRowPositionMetadata)
diff --git a/iceberg/common/src/main/scala/org/apache/iceberg/spark/source/GpuSparkPositionDeltaWrite.scala b/iceberg/common/src/main/scala/org/apache/iceberg/spark/source/GpuSparkPositionDeltaWrite.scala
index ce146a6522f..6eabbbee6e4 100644
--- a/iceberg/common/src/main/scala/org/apache/iceberg/spark/source/GpuSparkPositionDeltaWrite.scala
+++ b/iceberg/common/src/main/scala/org/apache/iceberg/spark/source/GpuSparkPositionDeltaWrite.scala
@@ -347,7 +347,7 @@ trait GpuDeltaWriter extends DeltaWriter[ColumnarBatch] {
   protected def newDeleteWriteContext(metadata: ColumnarBatch, rowId: ColumnarBatch)
   : DeleteWriteContext = {
     withResource(Seq(metadata, rowId)) { _ =>
-      var ret = DeleteWriteContext(spillPartValues = SpillableColumnarBatch(
+      var ret = new DeleteWriteContext(spillPartValues = SpillableColumnarBatch(
         extractToStruct(metadata, context.partitionOrdinal()),
         ACTIVE_ON_DECK_PRIORITY))
 
@@ -371,17 +371,22 @@ trait GpuDeltaWriter extends DeltaWriter[ColumnarBatch] {
   }
 }
 
-case class DeleteWriteContext(
-  spillPartValues: SpillableColumnarBatch = null,
-  spillPosDeletes: SpillableColumnarBatch = null,
-  uniqueSpecIdCol: RapidsHostColumnVector = null,
-  specIdCol: CudfColumnVector = null) extends AutoCloseable {
+class DeleteWriteContext(
+  val spillPartValues: SpillableColumnarBatch = null,
+  val spillPosDeletes: SpillableColumnarBatch = null,
+  val uniqueSpecIdCol: RapidsHostColumnVector = null,
+  val specIdCol: CudfColumnVector = null) extends AutoCloseable {
+
+  /** Replaces the `copy` that the compiler generated while this was a case class. */
+  def copy(
+      spillPartValues: SpillableColumnarBatch = this.spillPartValues,
+      spillPosDeletes: SpillableColumnarBatch = this.spillPosDeletes,
+      uniqueSpecIdCol: RapidsHostColumnVector = this.uniqueSpecIdCol,
+      specIdCol: CudfColumnVector = this.specIdCol): DeleteWriteContext =
+    new DeleteWriteContext(spillPartValues, spillPosDeletes, uniqueSpecIdCol, specIdCol)
 
   override def close(): Unit = {
-    productIterator
-      .map(_.asInstanceOf[AutoCloseable])
-      .toSeq
-      .safeClose()
+    Seq[AutoCloseable](spillPartValues, spillPosDeletes, uniqueSpecIdCol, specIdCol).safeClose()
   }
 }
 
@@ -480,7 +485,7 @@ trait GpuDeleteAndDataDeltaWriter extends GpuDeltaWriter {
                     }
                   } else {
                     // Unpartitioned spec
-                    Seq(ColumnarBatchWithPartition(
+                    Seq(new ColumnarBatchWithPartition(
                       SpillableColumnarBatch(filteredPositionDeletes,
                         SpillPriorities.ACTIVE_ON_DECK_PRIORITY),
                       emptyPartitionData
@@ -601,7 +606,7 @@ class GpuDeleteOnlyDeltaWriter(
                     }
                   } else {
                     // Unpartitioned spec
-                    Seq(ColumnarBatchWithPartition(
+                    Seq(new ColumnarBatchWithPartition(
                       SpillableColumnarBatch(filteredPositionDeletes,
                         SpillPriorities.ACTIVE_ON_DECK_PRIORITY),
                       emptyPartitionData
diff --git a/iceberg/common/src/main/scala/org/apache/iceberg/spark/source/GpuSparkWrite.scala b/iceberg/common/src/main/scala/org/apache/iceberg/spark/source/GpuSparkWrite.scala
index 5628ce311db..ad76c489b20 100644
--- a/iceberg/common/src/main/scala/org/apache/iceberg/spark/source/GpuSparkWrite.scala
+++ b/iceberg/common/src/main/scala/org/apache/iceberg/spark/source/GpuSparkWrite.scala
@@ -86,6 +86,10 @@ class GpuSparkWrite(cpu: Write) extends GpuWrite with RequiresDistributionAndOrd
 
   override def toString: String = s"GpuIcebergWrite(table=$table, format=$format)"
 
+  // Delegates to GpuSparkWriteAccess.abort, handing over the `cpu` write of this class.
+  private[source] def abort(messages: Array[WriterCommitMessage]): Unit =
+    GpuSparkWriteAccess.abort(cpu, messages)
+
   override def distributionStrictlyRequired(): Boolean =
     writeRequirements.distributionStrictlyRequired()
 
@@ -95,7 +99,6 @@ class GpuSparkWrite(cpu: Write) extends GpuWrite with RequiresDistributionAndOrd
     writeRequirements.advisoryPartitionSizeInBytes()
 
   override def requiredDistribution(): Distribution = writeRequirements.requiredDistribution()
-
   override def requiredOrdering(): Array[SortOrder] = writeRequirements.requiredOrdering()
 
   private[source] def createDataWriterFactory: DataWriterFactory = {
@@ -154,6 +157,16 @@ class GpuSparkWrite(cpu: Write) extends GpuWrite with RequiresDistributionAndOrd
       statsTracker,
       serializedHadoopConf)
   }
+
+  private[source] def files(messages: Array[WriterCommitMessage]): Seq[DataFile] = {
+    // Null commit messages are skipped before their data files are gathered.
+    val committed = messages.filter(_ != null)
+    committed.flatMap(GpuSparkWriteAccess.taskCommitFiles).toSeq
+  }
+
+  // Result type is inferred from GpuSparkWriteAccess.commitOperation, which does the work.
+  private[source] def commitOperation(operation: SnapshotUpdate[_], desc: String) =
+    GpuSparkWriteAccess.commitOperation(cpu, operation, desc)
 }
 
 object GpuSparkWrite {
@@ -250,7 +263,7 @@ object GpuSparkWrite {
         val transform = partitionField.transform()
         GpuTransform.tryFrom(transform) match {
           case Success(t) =>
-            val fieldTransform = GpuFieldTransform(partitionField.sourceId(), t)
+            val fieldTransform = new GpuFieldTransform(partitionField.sourceId(), t)
             if (!fieldTransform.supports(dataSparkType.get, dataSchema.get)) {
               meta.willNotWorkOnGpu(
                 s"Iceberg partition transform $transform is not supported on GPU")
diff --git a/integration_tests/src/main/python/delta_lake_test.py b/integration_tests/src/main/python/delta_lake_test.py
index 80afd59d5bf..4b6f46864d2 100644
--- a/integration_tests/src/main/python/delta_lake_test.py
+++ b/integration_tests/src/main/python/delta_lake_test.py
@@ -599,7 +599,7 @@ def test_delta_deletion_vector_interleaved_file_splits(
     """
     Tests deletion vector handling when files are interleaved in a way that causes their
     blocks to be split non-consecutively.
-    
+
     For this test, we set up two files A (large) and B (small) such that:
       - A is split into N PartitionedFiles: [max, ..., max, tail].
       - tail(A) < len(B) < max_split.
diff --git a/integration_tests/src/main/python/iceberg/iceberg_append_test.py b/integration_tests/src/main/python/iceberg/iceberg_append_test.py
index 152c5fe1377..c7223cd51db 100644
--- a/integration_tests/src/main/python/iceberg/iceberg_append_test.py
+++ b/integration_tests/src/main/python/iceberg/iceberg_append_test.py
@@ -494,4 +494,3 @@ def insert_data(spark):
         return spark.sql(f"INSERT INTO {table_name} SELECT * FROM {view_name}")
 
     assert_gpu_fallback_collect(insert_data, "AppendDataExec", conf=iceberg_write_enabled_conf)
-
diff --git a/pom.xml b/pom.xml
index 450211bcc4a..df560199c9b 100644
--- a/pom.xml
+++ b/pom.xml
@@ -67,8 +67,12 @@
         <module>dist</module>
         <module>integration_tests</module>
         <module>shuffle-plugin</module>
-        <module>sql-plugin</module>
         <module>sql-plugin-api</module>
+        <module>sql-plugin-format</module>
+        <module>sql-plugin-fileio</module>
+        <module>sql-plugin-columnar</module>
+        <module>sql-plugin-shims</module>
+        <module>sql-plugin</module>
         <module>tests</module>
         <module>tools</module>
         <module>udf-compiler</module>
@@ -805,6 +809,8 @@
         <rapids.module>.</rapids.module>
         <rapids.secondaryCacheDir>${spark.rapids.project.basedir}/target/${spark.version.classifier}/.sbt/1.0/zinc/org.scala-sbt</rapids.secondaryCacheDir>
         <allowConventionalDistJar>false</allowConventionalDistJar>
+        <rapids.shimplify.skip>false</rapids.shimplify.skip>
+        <rapids.build.info.skip>false</rapids.build.info.skip>
         <buildver>330</buildver>
         <maven.compiler.source>1.8</maven.compiler.source>
         <java.major.version>8</java.major.version>
@@ -1191,6 +1197,7 @@
                         <goals><goal>run</goal></goals>
                         <phase>generate-sources</phase>
                         <configuration>
+                            <skip>${rapids.shimplify.skip}</skip>
                             <target xmlns:ac="antlib:net.sf.antcontrib">
                                 <property name="dyn.shim.buildver" value="all.buildvers"/>
                                 <script language="jython" src="${spark.rapids.source.basedir}/build/dyn_shim_detection.py"/>
@@ -1216,6 +1223,7 @@
                         <id>generate-build-info</id>
                         <phase>generate-resources</phase>
                         <configuration>
+                            <skip>${rapids.build.info.skip}</skip>
                             <!-- Execute the shell script to generate the plugin build information. -->
                             <target name="build-info">
                                 <taskdef resource="net/sf/antcontrib/antcontrib.properties"/>
diff --git a/scala2.13/aggregator/pom.xml b/scala2.13/aggregator/pom.xml
index a6fb5f60651..d538fba4254 100644
--- a/scala2.13/aggregator/pom.xml
+++ b/scala2.13/aggregator/pom.xml
@@ -45,6 +45,7 @@
         <!-- Maven to register attached artifact , which we later replace -->
         <rapids.shim.jar.phase>initialize</rapids.shim.jar.phase>
         <rapids.source.jar.phase>none</rapids.source.jar.phase>
+        <rapids.aggregator.downstream.refresh.skip>false</rapids.aggregator.downstream.refresh.skip>
     </properties>
     <dependencies>
         <dependency>
@@ -196,6 +197,7 @@
                         <goals><goal>run</goal></goals>
                         <phase>process-classes</phase>
                         <configuration>
+                            <skip>${rapids.aggregator.downstream.refresh.skip}</skip>
                             <target>
                                 <taskdef resource="net/sf/antcontrib/antcontrib.properties"/>
                                 <property name="realAggJar"
diff --git a/scala2.13/pom.xml b/scala2.13/pom.xml
index 6b9a9aa8d68..7a414c746ea 100644
--- a/scala2.13/pom.xml
+++ b/scala2.13/pom.xml
@@ -67,8 +67,12 @@
         <module>dist</module>
         <module>integration_tests</module>
         <module>shuffle-plugin</module>
-        <module>sql-plugin</module>
         <module>sql-plugin-api</module>
+        <module>sql-plugin-format</module>
+        <module>sql-plugin-fileio</module>
+        <module>sql-plugin-columnar</module>
+        <module>sql-plugin-shims</module>
+        <module>sql-plugin</module>
         <module>tests</module>
         <module>tools</module>
         <module>udf-compiler</module>
@@ -805,6 +809,8 @@
         <rapids.module>.</rapids.module>
         <rapids.secondaryCacheDir>${spark.rapids.project.basedir}/target/${spark.version.classifier}/.sbt/1.0/zinc/org.scala-sbt</rapids.secondaryCacheDir>
         <allowConventionalDistJar>false</allowConventionalDistJar>
+        <rapids.shimplify.skip>false</rapids.shimplify.skip>
+        <rapids.build.info.skip>false</rapids.build.info.skip>
         <buildver>330</buildver>
         <maven.compiler.source>1.8</maven.compiler.source>
         <java.major.version>8</java.major.version>
@@ -1191,6 +1197,7 @@
                         <goals><goal>run</goal></goals>
                         <phase>generate-sources</phase>
                         <configuration>
+                            <skip>${rapids.shimplify.skip}</skip>
                             <target xmlns:ac="antlib:net.sf.antcontrib">
                                 <property name="dyn.shim.buildver" value="all.buildvers"/>
                                 <script language="jython" src="${spark.rapids.source.basedir}/build/dyn_shim_detection.py"/>
@@ -1216,6 +1223,7 @@
                         <id>generate-build-info</id>
                         <phase>generate-resources</phase>
                         <configuration>
+                            <skip>${rapids.build.info.skip}</skip>
                             <!-- Execute the shell script to generate the plugin build information. -->
                             <target name="build-info">
                                 <taskdef resource="net/sf/antcontrib/antcontrib.properties"/>
diff --git a/scala2.13/shuffle-plugin/pom.xml b/scala2.13/shuffle-plugin/pom.xml
index 191036cb1c0..ca29953086d 100644
--- a/scala2.13/shuffle-plugin/pom.xml
+++ b/scala2.13/shuffle-plugin/pom.xml
@@ -42,6 +42,12 @@
             <artifactId>spark-rapids-jni</artifactId>
             <classifier>${jni.classifier}</classifier>
         </dependency>
+        <dependency>
+            <groupId>com.nvidia</groupId>
+            <artifactId>rapids-4-spark-sql-plugin-api_${scala.binary.version}</artifactId>
+            <version>${project.version}</version>
+            <classifier>${spark.version.classifier}</classifier>
+        </dependency>
         <dependency>
             <groupId>org.scala-lang</groupId>
             <artifactId>scala-library</artifactId>
diff --git a/scala2.13/sql-plugin-columnar/pom.xml b/scala2.13/sql-plugin-columnar/pom.xml
new file mode 100644
index 00000000000..ced1a674ea2
--- /dev/null
+++ b/scala2.13/sql-plugin-columnar/pom.xml
@@ -0,0 +1,124 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!--
+  Copyright (c) 2026, NVIDIA CORPORATION.
+
+  Licensed under the Apache License, Version 2.0 (the "License");
+  you may not use this file except in compliance with the License.
+  You may obtain a copy of the License at
+
+     http://www.apache.org/licenses/LICENSE-2.0
+
+  Unless required by applicable law or agreed to in writing, software
+  distributed under the License is distributed on an "AS IS" BASIS,
+  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+  See the License for the specific language governing permissions and
+  limitations under the License.
+-->
+<project xmlns="http://maven.apache.org/POM/4.0.0"
+         xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
+         xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/xsd/maven-4.0.0.xsd">
+    <modelVersion>4.0.0</modelVersion>
+
+    <parent>
+        <groupId>com.nvidia</groupId>
+        <artifactId>rapids-4-spark-shim-deps-parent_2.13</artifactId>
+        <version>26.08.0-SNAPSHOT</version>
+        <relativePath>../shim-deps/pom.xml</relativePath>
+    </parent>
+
+    <artifactId>rapids-4-spark-sql-plugin-columnar_2.13</artifactId>
+    <description>Java-only columnar runtime plumbing for the RAPIDS SQL plugin</description>
+    <version>26.08.0-SNAPSHOT</version>
+
+    <properties> <!-- Module-level property values for sql-plugin-columnar -->
+        <rapids.module>sql-plugin-columnar</rapids.module>
+        <rapids.compressed.artifact>false</rapids.compressed.artifact>
+        <rapids.default.jar.excludePattern>**/*</rapids.default.jar.excludePattern> <!-- NOTE(review): presumably keeps every file out of the default jar; confirm where the parent build consumes it -->
+        <rapids.shim.jar.phase>package</rapids.shim.jar.phase>
+        <rapids.shimplify.skip>true</rapids.shimplify.skip> <!-- scala2.13/pom.xml defaults this to false and passes it as the <skip> of its generate-sources antrun execution -->
+    </properties>
+
+    <dependencies>
+        <dependency>
+            <groupId>com.nvidia</groupId>
+            <artifactId>spark-rapids-jni</artifactId>
+            <classifier>${jni.classifier}</classifier>
+        </dependency>
+        <dependency>
+            <groupId>com.nvidia</groupId>
+            <artifactId>rapids-4-spark-sql-plugin-format_${scala.binary.version}</artifactId>
+            <version>${project.version}</version>
+            <classifier>${spark.version.classifier}</classifier>
+        </dependency>
+        <dependency>
+            <groupId>org.apache.spark</groupId>
+            <artifactId>spark-sql_${scala.binary.version}</artifactId>
+            <version>${spark.version}</version>
+            <scope>provided</scope>
+        </dependency>
+    </dependencies>
+
+    <build> <!-- Build setup for a module whose description calls it Java-only -->
+        <plugins>
+            <plugin>
+                <groupId>org.apache.maven.plugins</groupId>
+                <artifactId>maven-compiler-plugin</artifactId> <!-- javac is bound explicitly to the compile and test-compile phases below -->
+                <executions>
+                    <execution>
+                        <id>default-compile</id>
+                        <phase>compile</phase>
+                        <goals>
+                            <goal>compile</goal>
+                        </goals>
+                    </execution>
+                    <execution>
+                        <id>default-testCompile</id>
+                        <phase>test-compile</phase>
+                        <goals>
+                            <goal>testCompile</goal>
+                        </goals>
+                    </execution>
+                </executions>
+                <configuration>
+                    <release>${java.major.version}</release> <!-- java.major.version defaults to 8 in scala2.13/pom.xml -->
+                    <compilerArgs>
+                        <arg>-Xlint:all,-serial,-path,-try,-processing</arg> <!-- all javac lint categories except serial, path, try and processing -->
+                    </compilerArgs>
+                </configuration>
+            </plugin>
+            <plugin>
+                <groupId>net.alchim31.maven</groupId>
+                <artifactId>scala-maven-plugin</artifactId> <!-- every execution listed here is moved to phase "none", so it never runs in this module; presumably they are inherited from the parent (confirm) -->
+                <executions>
+                    <execution>
+                        <id>eclipse-add-source</id>
+                        <phase>none</phase>
+                    </execution>
+                    <execution>
+                        <id>scala-compile-first</id>
+                        <phase>none</phase>
+                    </execution>
+                    <execution>
+                        <id>scala-test-compile-first</id>
+                        <phase>none</phase>
+                    </execution>
+                    <execution>
+                        <id>attach-scaladocs</id>
+                        <phase>none</phase>
+                    </execution>
+                </executions>
+            </plugin>
+            <plugin>
+                <groupId>org.apache.rat</groupId>
+                <artifactId>apache-rat-plugin</artifactId> <!-- no local configuration is given for this plugin -->
+            </plugin>
+            <plugin>
+                <groupId>org.apache.maven.plugins</groupId>
+                <artifactId>maven-surefire-plugin</artifactId>
+                <configuration>
+                    <skipTests>true</skipTests> <!-- surefire does not execute tests for this module -->
+                </configuration>
+            </plugin>
+        </plugins>
+    </build>
+</project>
diff --git a/scala2.13/sql-plugin-fileio/pom.xml b/scala2.13/sql-plugin-fileio/pom.xml
new file mode 100644
index 00000000000..6c9a666e8bb
--- /dev/null
+++ b/scala2.13/sql-plugin-fileio/pom.xml
@@ -0,0 +1,118 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!--
+  Copyright (c) 2026, NVIDIA CORPORATION.
+
+  Licensed under the Apache License, Version 2.0 (the "License");
+  you may not use this file except in compliance with the License.
+  You may obtain a copy of the License at
+
+     http://www.apache.org/licenses/LICENSE-2.0
+
+  Unless required by applicable law or agreed to in writing, software
+  distributed under the License is distributed on an "AS IS" BASIS,
+  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+  See the License for the specific language governing permissions and
+  limitations under the License.
+-->
+<project xmlns="http://maven.apache.org/POM/4.0.0"
+         xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
+         xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/xsd/maven-4.0.0.xsd">
+    <modelVersion>4.0.0</modelVersion>
+
+    <parent>
+        <groupId>com.nvidia</groupId>
+        <artifactId>rapids-4-spark-shim-deps-parent_2.13</artifactId>
+        <version>26.08.0-SNAPSHOT</version>
+        <relativePath>../shim-deps/pom.xml</relativePath>
+    </parent>
+
+    <artifactId>rapids-4-spark-sql-plugin-fileio_2.13</artifactId>
+    <description>Java-only file I/O runtime plumbing for the RAPIDS SQL plugin</description>
+    <version>26.08.0-SNAPSHOT</version>
+
+    <properties> <!-- Module-level property values for sql-plugin-fileio -->
+        <rapids.module>sql-plugin-fileio</rapids.module>
+        <rapids.compressed.artifact>false</rapids.compressed.artifact>
+        <rapids.default.jar.excludePattern>**/*</rapids.default.jar.excludePattern> <!-- NOTE(review): presumably keeps every file out of the default jar; confirm where the parent build consumes it -->
+        <rapids.shim.jar.phase>package</rapids.shim.jar.phase>
+        <rapids.shimplify.skip>true</rapids.shimplify.skip> <!-- scala2.13/pom.xml defaults this to false and passes it as the <skip> of its generate-sources antrun execution -->
+    </properties>
+
+    <dependencies>
+        <dependency>
+            <groupId>com.nvidia</groupId>
+            <artifactId>spark-rapids-jni</artifactId>
+            <classifier>${jni.classifier}</classifier>
+        </dependency>
+        <dependency>
+            <groupId>org.apache.spark</groupId>
+            <artifactId>spark-core_${scala.binary.version}</artifactId>
+            <version>${spark.version}</version>
+            <scope>provided</scope>
+        </dependency>
+    </dependencies>
+
+    <build> <!-- Build setup for a module whose description calls it Java-only -->
+        <plugins>
+            <plugin>
+                <groupId>org.apache.maven.plugins</groupId>
+                <artifactId>maven-compiler-plugin</artifactId> <!-- javac is bound explicitly to the compile and test-compile phases below -->
+                <executions>
+                    <execution>
+                        <id>default-compile</id>
+                        <phase>compile</phase>
+                        <goals>
+                            <goal>compile</goal>
+                        </goals>
+                    </execution>
+                    <execution>
+                        <id>default-testCompile</id>
+                        <phase>test-compile</phase>
+                        <goals>
+                            <goal>testCompile</goal>
+                        </goals>
+                    </execution>
+                </executions>
+                <configuration>
+                    <release>${java.major.version}</release> <!-- java.major.version defaults to 8 in scala2.13/pom.xml -->
+                    <compilerArgs>
+                        <arg>-Xlint:all,-serial,-path,-try,-processing</arg> <!-- all javac lint categories except serial, path, try and processing -->
+                    </compilerArgs>
+                </configuration>
+            </plugin>
+            <plugin>
+                <groupId>net.alchim31.maven</groupId>
+                <artifactId>scala-maven-plugin</artifactId> <!-- every execution listed here is moved to phase "none", so it never runs in this module; presumably they are inherited from the parent (confirm) -->
+                <executions>
+                    <execution>
+                        <id>eclipse-add-source</id>
+                        <phase>none</phase>
+                    </execution>
+                    <execution>
+                        <id>scala-compile-first</id>
+                        <phase>none</phase>
+                    </execution>
+                    <execution>
+                        <id>scala-test-compile-first</id>
+                        <phase>none</phase>
+                    </execution>
+                    <execution>
+                        <id>attach-scaladocs</id>
+                        <phase>none</phase>
+                    </execution>
+                </executions>
+            </plugin>
+            <plugin>
+                <groupId>org.apache.rat</groupId>
+                <artifactId>apache-rat-plugin</artifactId> <!-- no local configuration is given for this plugin -->
+            </plugin>
+            <plugin>
+                <groupId>org.apache.maven.plugins</groupId>
+                <artifactId>maven-surefire-plugin</artifactId>
+                <configuration>
+                    <skipTests>true</skipTests> <!-- surefire does not execute tests for this module -->
+                </configuration>
+            </plugin>
+        </plugins>
+    </build>
+</project>
diff --git a/scala2.13/sql-plugin-format/pom.xml b/scala2.13/sql-plugin-format/pom.xml
new file mode 100644
index 00000000000..471656fe973
--- /dev/null
+++ b/scala2.13/sql-plugin-format/pom.xml
@@ -0,0 +1,111 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!--
+  Copyright (c) 2026, NVIDIA CORPORATION.
+
+  Licensed under the Apache License, Version 2.0 (the "License");
+  you may not use this file except in compliance with the License.
+  You may obtain a copy of the License at
+
+     http://www.apache.org/licenses/LICENSE-2.0
+
+  Unless required by applicable law or agreed to in writing, software
+  distributed under the License is distributed on an "AS IS" BASIS,
+  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+  See the License for the specific language governing permissions and
+  limitations under the License.
+-->
+<project xmlns="http://maven.apache.org/POM/4.0.0"
+         xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
+         xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/xsd/maven-4.0.0.xsd">
+    <modelVersion>4.0.0</modelVersion>
+
+    <parent>
+        <groupId>com.nvidia</groupId>
+        <artifactId>rapids-4-spark-shim-deps-parent_2.13</artifactId>
+        <version>26.08.0-SNAPSHOT</version>
+        <relativePath>../shim-deps/pom.xml</relativePath>
+    </parent>
+
+    <artifactId>rapids-4-spark-sql-plugin-format_2.13</artifactId>
+    <description>Java-only FlatBuffers format classes for the RAPIDS SQL plugin</description>
+    <version>26.08.0-SNAPSHOT</version>
+
+    <properties> <!-- Module-level property values for sql-plugin-format -->
+        <rapids.module>sql-plugin-format</rapids.module>
+        <rapids.compressed.artifact>false</rapids.compressed.artifact>
+        <rapids.default.jar.excludePattern>**/*</rapids.default.jar.excludePattern> <!-- NOTE(review): presumably keeps every file out of the default jar; confirm where the parent build consumes it -->
+        <rapids.shim.jar.phase>package</rapids.shim.jar.phase>
+        <rapids.shimplify.skip>true</rapids.shimplify.skip> <!-- scala2.13/pom.xml defaults this to false and passes it as the <skip> of its generate-sources antrun execution -->
+    </properties>
+
+    <dependencies>
+        <dependency>
+            <groupId>com.google.flatbuffers</groupId>
+            <artifactId>flatbuffers-java</artifactId>
+        </dependency>
+    </dependencies>
+
+    <build> <!-- Build setup for a module whose description calls it Java-only -->
+        <plugins>
+            <plugin>
+                <groupId>org.apache.maven.plugins</groupId>
+                <artifactId>maven-compiler-plugin</artifactId> <!-- javac is bound explicitly to the compile and test-compile phases below -->
+                <executions>
+                    <execution>
+                        <id>default-compile</id>
+                        <phase>compile</phase>
+                        <goals>
+                            <goal>compile</goal>
+                        </goals>
+                    </execution>
+                    <execution>
+                        <id>default-testCompile</id>
+                        <phase>test-compile</phase>
+                        <goals>
+                            <goal>testCompile</goal>
+                        </goals>
+                    </execution>
+                </executions>
+                <configuration>
+                    <release>${java.major.version}</release> <!-- java.major.version defaults to 8 in scala2.13/pom.xml -->
+                    <compilerArgs>
+                        <arg>-Xlint:all,-serial,-path,-try,-processing</arg> <!-- all javac lint categories except serial, path, try and processing -->
+                    </compilerArgs>
+                </configuration>
+            </plugin>
+            <plugin>
+                <groupId>net.alchim31.maven</groupId>
+                <artifactId>scala-maven-plugin</artifactId> <!-- every execution listed here is moved to phase "none", so it never runs in this module; presumably they are inherited from the parent (confirm) -->
+                <executions>
+                    <execution>
+                        <id>eclipse-add-source</id>
+                        <phase>none</phase>
+                    </execution>
+                    <execution>
+                        <id>scala-compile-first</id>
+                        <phase>none</phase>
+                    </execution>
+                    <execution>
+                        <id>scala-test-compile-first</id>
+                        <phase>none</phase>
+                    </execution>
+                    <execution>
+                        <id>attach-scaladocs</id>
+                        <phase>none</phase>
+                    </execution>
+                </executions>
+            </plugin>
+            <plugin>
+                <groupId>org.apache.rat</groupId>
+                <artifactId>apache-rat-plugin</artifactId> <!-- no local configuration is given for this plugin -->
+            </plugin>
+            <plugin>
+                <groupId>org.apache.maven.plugins</groupId>
+                <artifactId>maven-surefire-plugin</artifactId>
+                <configuration>
+                    <skipTests>true</skipTests> <!-- surefire does not execute tests for this module -->
+                </configuration>
+            </plugin>
+        </plugins>
+    </build>
+</project>
diff --git a/scala2.13/sql-plugin-shims/pom.xml b/scala2.13/sql-plugin-shims/pom.xml
new file mode 100644
index 00000000000..db47aac3d38
--- /dev/null
+++ b/scala2.13/sql-plugin-shims/pom.xml
@@ -0,0 +1,68 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!--
+  Copyright (c) 2026, NVIDIA CORPORATION.
+
+  Licensed under the Apache License, Version 2.0 (the "License");
+  you may not use this file except in compliance with the License.
+  You may obtain a copy of the License at
+
+     http://www.apache.org/licenses/LICENSE-2.0
+
+  Unless required by applicable law or agreed to in writing, software
+  distributed under the License is distributed on an "AS IS" BASIS,
+  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+  See the License for the specific language governing permissions and
+  limitations under the License.
+-->
+<project xmlns="http://maven.apache.org/POM/4.0.0"
+         xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
+         xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/xsd/maven-4.0.0.xsd">
+    <modelVersion>4.0.0</modelVersion>
+
+    <parent>
+        <groupId>com.nvidia</groupId>
+        <artifactId>rapids-4-spark-shim-deps-parent_2.13</artifactId>
+        <version>26.08.0-SNAPSHOT</version>
+        <relativePath>../shim-deps/pom.xml</relativePath>
+    </parent>
+    <artifactId>rapids-4-spark-sql-shims_2.13</artifactId>
+    <name>RAPIDS Accelerator for Apache Spark SQL Plugin Shims</name>
+    <description>Compile-time isolated SQL plugin shims</description>
+    <version>26.08.0-SNAPSHOT</version>
+
+    <properties> <!-- Module-level property values for sql-plugin-shims; rapids.shimplify.skip is not overridden here, unlike the format, fileio and columnar modules -->
+        <rapids.module>sql-plugin-shims</rapids.module>
+        <rapids.compressed.artifact>false</rapids.compressed.artifact>
+        <rapids.default.jar.excludePattern>**/*</rapids.default.jar.excludePattern> <!-- NOTE(review): presumably keeps every file out of the default jar; confirm where the parent build consumes it -->
+        <rapids.shim.jar.phase>package</rapids.shim.jar.phase>
+    </properties>
+
+    <dependencies>
+        <dependency>
+            <groupId>com.nvidia</groupId>
+            <artifactId>rapids-4-spark-sql-plugin-api_${scala.binary.version}</artifactId>
+            <version>${project.version}</version>
+            <classifier>${spark.version.classifier}</classifier>
+        </dependency>
+        <dependency>
+            <groupId>org.scala-lang</groupId>
+            <artifactId>scala-library</artifactId>
+        </dependency>
+    </dependencies>
+
+    <build> <!-- Lists three plugins without any local configuration or executions -->
+        <plugins>
+            <plugin>
+                <groupId>net.alchim31.maven</groupId>
+                <artifactId>scala-maven-plugin</artifactId> <!-- NOTE(review): presumably picks up its executions from the parent chain; confirm -->
+            </plugin>
+            <plugin>
+                <artifactId>maven-antrun-plugin</artifactId> <!-- groupId omitted; Maven falls back to org.apache.maven.plugins for plugins -->
+            </plugin>
+            <plugin>
+                <groupId>org.apache.rat</groupId>
+                <artifactId>apache-rat-plugin</artifactId>
+            </plugin>
+        </plugins>
+    </build>
+</project>
diff --git a/scala2.13/sql-plugin/pom.xml b/scala2.13/sql-plugin/pom.xml
index 14efec5aea3..6b0925787f8 100644
--- a/scala2.13/sql-plugin/pom.xml
+++ b/scala2.13/sql-plugin/pom.xml
@@ -54,12 +54,37 @@
             <version>${spark-rapids-private.version}</version>
             <classifier>${spark.version.classifier}</classifier>
         </dependency>
+        <dependency>
+            <groupId>com.nvidia</groupId>
+            <artifactId>rapids-4-spark-sql-plugin-format_${scala.binary.version}</artifactId>
+            <version>${project.version}</version>
+            <classifier>${spark.version.classifier}</classifier>
+        </dependency>
+        <dependency>
+            <groupId>com.nvidia</groupId>
+            <artifactId>rapids-4-spark-sql-plugin-fileio_${scala.binary.version}</artifactId>
+            <version>${project.version}</version>
+            <classifier>${spark.version.classifier}</classifier>
+        </dependency>
+        <dependency>
+            <groupId>com.nvidia</groupId>
+            <artifactId>rapids-4-spark-sql-plugin-columnar_${scala.binary.version}</artifactId>
+            <version>${project.version}</version>
+            <classifier>${spark.version.classifier}</classifier>
+        </dependency>
         <dependency>
             <groupId>com.nvidia</groupId>
             <artifactId>rapids-4-spark-sql-plugin-api_${scala.binary.version}</artifactId>
             <version>${project.version}</version>
             <classifier>${spark.version.classifier}</classifier>
         </dependency>
+        <dependency>
+            <groupId>com.nvidia</groupId>
+            <artifactId>rapids-4-spark-sql-shims_${scala.binary.version}</artifactId>
+            <version>${project.version}</version>
+            <classifier>${spark.version.classifier}</classifier>
+            <scope>provided</scope>
+        </dependency>
         <dependency>
             <groupId>org.scala-lang</groupId>
             <artifactId>scala-library</artifactId>
@@ -219,6 +244,27 @@
                 <groupId>net.alchim31.maven</groupId>
                 <artifactId>scala-maven-plugin</artifactId>
             </plugin>
+            <plugin> <!-- Merges the compiled sql-shims classes into this module's own output before packaging -->
+                <groupId>org.apache.maven.plugins</groupId>
+                <artifactId>maven-dependency-plugin</artifactId>
+                <version>3.6.1</version>
+                <executions>
+                    <execution>
+                        <id>unpack-sql-plugin-shims</id>
+                        <phase>prepare-package</phase>
+                        <goals>
+                            <goal>unpack-dependencies</goal>
+                        </goals>
+                        <configuration>
+                            <includeGroupIds>com.nvidia</includeGroupIds>
+                            <includeArtifactIds>rapids-4-spark-sql-shims_${scala.binary.version}</includeArtifactIds>
+                            <excludeTransitive>true</excludeTransitive> <!-- only the shims artifact itself, not what it depends on -->
+                            <includes>**/*.class</includes> <!-- class files only; other jar entries are not unpacked -->
+                            <outputDirectory>${project.build.outputDirectory}</outputDirectory> <!-- this module's compiled-classes directory -->
+                        </configuration>
+                    </execution>
+                </executions>
+            </plugin>
             <plugin>
                 <groupId>org.apache.rat</groupId>
                 <artifactId>apache-rat-plugin</artifactId>
diff --git a/shuffle-plugin/pom.xml b/shuffle-plugin/pom.xml
index ff481d52819..e1148736125 100644
--- a/shuffle-plugin/pom.xml
+++ b/shuffle-plugin/pom.xml
@@ -42,6 +42,12 @@
             <artifactId>spark-rapids-jni</artifactId>
             <classifier>${jni.classifier}</classifier>
         </dependency>
+        <dependency>
+            <groupId>com.nvidia</groupId>
+            <artifactId>rapids-4-spark-sql-plugin-api_${scala.binary.version}</artifactId>
+            <version>${project.version}</version>
+            <classifier>${spark.version.classifier}</classifier>
+        </dependency>
         <dependency>
             <groupId>org.scala-lang</groupId>
             <artifactId>scala-library</artifactId>
diff --git a/shuffle-plugin/src/main/java/com/nvidia/spark/rapids/shuffle/ucx/Rkeys.java b/shuffle-plugin/src/main/java/com/nvidia/spark/rapids/shuffle/ucx/Rkeys.java
new file mode 100644
index 00000000000..2882b1db81d
--- /dev/null
+++ b/shuffle-plugin/src/main/java/com/nvidia/spark/rapids/shuffle/ucx/Rkeys.java
@@ -0,0 +1,57 @@
+/*
+ * Copyright (c) 2020-2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.nvidia.spark.rapids.shuffle.ucx;
+
+import java.nio.ByteBuffer;
+import java.util.Objects;
+
+import scala.collection.Seq;
+
+/** Value wrapper around the UCX remote keys registered for a peer. */
+public final class Rkeys {
+  private final Seq<ByteBuffer> rkeys;
+
+  /** Stores the given sequence as-is; no copy is made. */
+  public Rkeys(Seq<ByteBuffer> rkeys) {
+    this.rkeys = rkeys;
+  }
+
+  /** Returns the sequence given to the constructor. */
+  public Seq<ByteBuffer> rkeys() {
+    return this.rkeys;
+  }
+
+  /** Equal when the other object is an {@code Rkeys} wrapping an equal sequence. */
+  @Override
+  public boolean equals(Object candidate) {
+    if (candidate == this) {
+      return true;
+    }
+    return candidate instanceof Rkeys && Objects.equals(rkeys, ((Rkeys) candidate).rkeys);
+  }
+
+  @Override
+  public int hashCode() {
+    // Same value as Objects.hash(rkeys): 31 * 1 + hash of the single element.
+    return 31 + Objects.hashCode(rkeys);
+  }
+
+  @Override
+  public String toString() {
+    return new StringBuilder("Rkeys(").append(rkeys).append(')').toString();
+  }
+}
diff --git a/shuffle-plugin/src/main/java/com/nvidia/spark/rapids/shuffle/ucx/UCXActiveMessage.java b/shuffle-plugin/src/main/java/com/nvidia/spark/rapids/shuffle/ucx/UCXActiveMessage.java
new file mode 100644
index 00000000000..cb1622c3adb
--- /dev/null
+++ b/shuffle-plugin/src/main/java/com/nvidia/spark/rapids/shuffle/ucx/UCXActiveMessage.java
@@ -0,0 +1,69 @@
+/*
+ * Copyright (c) 2020-2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.nvidia.spark.rapids.shuffle.ucx;
+
+import java.util.Objects;
+
+/**
+ * Pairs a UCX active message id with the dynamic header that travels with it. A request is
+ * sent with a header its response handler knows about, and the request handler echoes that
+ * header back when it is done.
+ */
+public final class UCXActiveMessage {
+  private final int activeMessageId;
+  private final long header;
+  private final boolean forceRndv;
+
+  public UCXActiveMessage(int activeMessageId, long header, boolean forceRndv) {
+    this.activeMessageId = activeMessageId;
+    this.header = header;
+    this.forceRndv = forceRndv;
+  }
+
+  public int activeMessageId() {
+    return this.activeMessageId;
+  }
+
+  public long header() {
+    return this.header;
+  }
+
+  public boolean forceRndv() {
+    return this.forceRndv;
+  }
+
+  @Override
+  public boolean equals(Object candidate) {
+    if (!(candidate instanceof UCXActiveMessage)) {
+      return false;
+    }
+    UCXActiveMessage that = (UCXActiveMessage) candidate;
+    return forceRndv == that.forceRndv && header == that.header &&
+        activeMessageId == that.activeMessageId;
+  }
+
+  @Override
+  public int hashCode() {
+    return Objects.hash(activeMessageId, header, forceRndv);
+  }
+
+  /** Renders the id and header as zero-padded upper-case hex; forceRndv is not included. */
+  @Override
+  public String toString() {
+    return String.format("[amId=0x%08X, hdr=0x%016X]", activeMessageId, header);
+  }
+}
diff --git a/shuffle-plugin/src/main/java/com/nvidia/spark/rapids/shuffle/ucx/UCXError.java b/shuffle-plugin/src/main/java/com/nvidia/spark/rapids/shuffle/ucx/UCXError.java
new file mode 100644
index 00000000000..48526126a9d
--- /dev/null
+++ b/shuffle-plugin/src/main/java/com/nvidia/spark/rapids/shuffle/ucx/UCXError.java
@@ -0,0 +1,61 @@
+/*
+ * Copyright (c) 2020-2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.nvidia.spark.rapids.shuffle.ucx;
+
+import java.util.Objects;
+
+/** Status code and message describing an error reported by UCX. */
+public final class UCXError {
+  private final int ucsStatus;
+  private final String errorMsg;
+
+  public UCXError(int ucsStatus, String errorMsg) {
+    this.ucsStatus = ucsStatus;
+    this.errorMsg = errorMsg;
+  }
+
+  public int ucsStatus() {
+    return this.ucsStatus;
+  }
+
+  public String errorMsg() {
+    return this.errorMsg;
+  }
+
+  /** Equal when both the status code and the (possibly null) message match. */
+  @Override
+  public boolean equals(Object candidate) {
+    if (!(candidate instanceof UCXError)) {
+      return false;
+    }
+    UCXError that = (UCXError) candidate;
+    return ucsStatus == that.ucsStatus && Objects.equals(errorMsg, that.errorMsg);
+  }
+
+  @Override
+  public int hashCode() {
+    return Objects.hash(ucsStatus, errorMsg);
+  }
+
+  /** Renders as {@code UCXError(<status>,<message>)}. */
+  @Override
+  public String toString() {
+    StringBuilder text = new StringBuilder("UCXError(");
+    text.append(ucsStatus).append(',').append(errorMsg);
+    return text.append(')').toString();
+  }
+}
diff --git a/shuffle-plugin/src/main/scala/com/nvidia/spark/rapids/shuffle/ucx/UCX.scala b/shuffle-plugin/src/main/scala/com/nvidia/spark/rapids/shuffle/ucx/UCX.scala
index 6a8336f2a4a..9f6d87f1e50 100644
--- a/shuffle-plugin/src/main/scala/com/nvidia/spark/rapids/shuffle/ucx/UCX.scala
+++ b/shuffle-plugin/src/main/scala/com/nvidia/spark/rapids/shuffle/ucx/UCX.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2020-2023, NVIDIA CORPORATION.
+ * Copyright (c) 2020-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -40,22 +40,6 @@ import org.apache.spark.internal.Logging
 import org.apache.spark.sql.rapids.storage.RapidsStorageUtils
 import org.apache.spark.storage.BlockManagerId
 
-case class Rkeys(rkeys: Seq[ByteBuffer])
-
-/**
- * A simple wrapper for an Active Message Id and a header. This pair
- * is used together when dealing with Active Messages, with `activeMessageId`
- * being a fire-and-forget registration with UCX, and `header` being a dynamic long
- * we continue to update (it contains the local executor id, and the transaction id).
- *
- * This allows us to send a request (with a header that the response handler knows about),
- * and for the request handler to echo back that header when it's done.
- */
-case class UCXActiveMessage(activeMessageId: Int, header: Long, forceRndv: Boolean) {
-  override def toString: String =
-    UCX.formatAmIdAndHeader(activeMessageId, header)
-}
-
 /**
  * The UCX class wraps JUCX classes and handles all communication with UCX from other
  * parts of the shuffle code. It manages a `UcpContext` and `UcpWorker`, for the
@@ -427,7 +411,7 @@ class UCX(transport: UCXShuffleTransport, executor: BlockManagerId, rapidsConf:
               s"Received message with wrong header size $headerSize")
           } else {
             val header = UcxUtils.getByteBufferView(headerAddr, headerSize).getLong()
-            val am = UCXActiveMessage(reg.activeMessageId, header, reg.useRndv)
+            val am = new UCXActiveMessage(reg.activeMessageId, header, reg.useRndv)
 
             withResource(new NvtxRange("AM Receive", NvtxColor.YELLOW)) { _ =>
               logDebug(s"Active Message received: $am")
@@ -448,7 +432,7 @@ class UCX(transport: UCXShuffleTransport, executor: BlockManagerId, rapidsConf:
                     cb.onSuccess(am, mtb)
                   case _ =>
                     cb.onError(am,
-                      UCXError(0, "Received an eager message for non-metadata message"))
+                      new UCXError(0, "Received an eager message for non-metadata message"))
                 })
 
                 // we return OK telling UCX `amData` is ok to be closed, along with the eagerly
@@ -475,7 +459,7 @@ class UCX(transport: UCXShuffleTransport, executor: BlockManagerId, rapidsConf:
                                     s" status=$ucsStatus, msg=$errorMsg")
                                 cb.onCancel(am)
                               } else {
-                                cb.onError(am, UCXError(ucsStatus, errorMsg))
+                                cb.onError(am, new UCXError(ucsStatus, errorMsg))
                               }
                             }
                           }
@@ -833,7 +817,7 @@ class UCX(transport: UCXShuffleTransport, executor: BlockManagerId, rapidsConf:
         s"for ${connectionRequest.getClientAddress}")
 
       // Register a `Control` active message for a handshake response
-      val responseAm = UCXActiveMessage(
+      val responseAm = new UCXActiveMessage(
         UCXConnection.composeResponseAmId(MessageType.Control), ep.getNativeId, false)
 
       registerResponseHandler(responseAm, new UCXAmCallback {
@@ -918,7 +902,7 @@ class UCX(transport: UCXShuffleTransport, executor: BlockManagerId, rapidsConf:
       if (reverseLookupEndpoints.containsKey(ucpEndpoint)) {
         val executorId = reverseLookupEndpoints.get(ucpEndpoint)
         if (!isShuttingDown) {
-          val error = UCXError(errorCode, errorString)
+          val error = new UCXError(errorCode, errorString)
           logError(s"UcpListener detected an error for executorId $executorId: " +
             s"$error")
         }
@@ -1036,7 +1020,7 @@ class UCX(transport: UCXShuffleTransport, executor: BlockManagerId, rapidsConf:
 
     // called from progress thread - on ConnectionRequest
     private def sendControlRequest(ep: UcpEndpoint, responseAm: UCXActiveMessage): Unit = {
-      val requestAm = UCXActiveMessage(
+      val requestAm = new UCXActiveMessage(
         UCXConnection.composeRequestAmId(MessageType.Control), ep.getNativeId, false)
 
       val handshakeMsg =
@@ -1048,7 +1032,7 @@ class UCX(transport: UCXShuffleTransport, executor: BlockManagerId, rapidsConf:
           TransportUtils.getAddress(handshakeMsg), handshakeMsg.remaining(),
           new UcxCallback {
             override def onError(ucsStatus: Int, errorMsg: String): Unit = {
-              val error = UCXError(ucsStatus, errorMsg)
+              val error = new UCXError(ucsStatus, errorMsg)
               logError(s"Error sending handshake header, " +
                 s"error: $error active message: $requestAm handshake: $handshakeMsg")
               RapidsStorageUtils.dispose(handshakeMsg)
@@ -1071,7 +1055,7 @@ class UCX(transport: UCXShuffleTransport, executor: BlockManagerId, rapidsConf:
       // reply
       val handshakeMsg = UCXConnection.packHandshake(localExecutorId, localRkeys)
       val responseAmId = UCXConnection.composeResponseAmId(MessageType.Control)
-      val responseAm = UCXActiveMessage(responseAmId, requestAm.header, false)
+      val responseAm = new UCXActiveMessage(responseAmId, requestAm.header, false)
       val address = TransportUtils.getAddress(handshakeMsg)
       val len = handshakeMsg.remaining()
 
@@ -1080,7 +1064,7 @@ class UCX(transport: UCXShuffleTransport, executor: BlockManagerId, rapidsConf:
         sendActiveMessage(ep, responseAm, address, len,
           new UcxCallback {
             override def onError(ucsStatus: Int, errorMsg: String): Unit = {
-              val error = UCXError(ucsStatus, errorMsg)
+              val error = new UCXError(ucsStatus, errorMsg)
               logError(s"Error replying to sending handshake header, " +
                 s"error: $error active message: $responseAm")
               RapidsStorageUtils.dispose(handshakeMsg)
diff --git a/shuffle-plugin/src/main/scala/com/nvidia/spark/rapids/shuffle/ucx/UCXConnection.scala b/shuffle-plugin/src/main/scala/com/nvidia/spark/rapids/shuffle/ucx/UCXConnection.scala
index f6966df02a8..5464ff6a507 100644
--- a/shuffle-plugin/src/main/scala/com/nvidia/spark/rapids/shuffle/ucx/UCXConnection.scala
+++ b/shuffle-plugin/src/main/scala/com/nvidia/spark/rapids/shuffle/ucx/UCXConnection.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2020-2023, NVIDIA CORPORATION.
+ * Copyright (c) 2020-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -16,7 +16,7 @@
 
 package com.nvidia.spark.rapids.shuffle.ucx
 
-import java.nio.ByteBuffer
+import java.nio.{Buffer, ByteBuffer}
 import java.util.concurrent.ConcurrentHashMap
 
 import ai.rapids.cudf.MemoryBuffer
@@ -30,7 +30,6 @@ import org.apache.spark.internal.Logging
  * These are private apis used within the ucx package.
  */
 
-case class UCXError(ucsStatus: Int, errorMsg: String)
 
 /**
  * `UCXAmCallback` is used by [[Transaction]] to handle UCX Active Messages operations.
@@ -94,8 +93,8 @@ class UCXServerConnection(ucx: UCX, transport: UCXShuffleTransport)
     logDebug(s"Sending to ${peerExecutorId} at ${TransportUtils.toHex(header)} " +
       s"with ${buffer}")
 
-    val sendAm = UCXActiveMessage(UCXConnection.composeSendAmId(messageType),
-      header, forceRndv = true)
+    val sendAm = new UCXActiveMessage(UCXConnection.composeSendAmId(messageType),
+      header, true)
 
     ucx.sendActiveMessage(peerExecutorId, sendAm, buffer,
       new UcxCallback {
@@ -123,7 +122,7 @@ class UCXServerConnection(ucx: UCX, transport: UCXShuffleTransport)
     logDebug(s"Responding to ${peerExecutorId} at ${TransportUtils.toHex(header)} " +
       s"with ${response}")
 
-    val responseAm = UCXActiveMessage(
+    val responseAm = new UCXActiveMessage(
       UCXConnection.composeResponseAmId(messageType), header, false)
     ucx.sendActiveMessage(peerExecutorId, responseAm, response,
       new UcxCallback {
@@ -191,12 +190,12 @@ class UCXClientConnection(peerExecutorId: Long, ucx: UCX, transport: UCXShuffleT
     // Register the active message response handler. Note that the `requestHeader`
     // is expected to come back with the response, and is used to find the
     // correct callback (this is an implementation detail in UCX.scala)
-    val responseAm = UCXActiveMessage(
+    val responseAm = new UCXActiveMessage(
       UCXConnection.composeResponseAmId(messageType), requestHeader, false)
     ucx.registerResponseHandler(responseAm, amCallback)
 
     // kick-off the request
-    val requestAm = UCXActiveMessage(
+    val requestAm = new UCXActiveMessage(
       UCXConnection.composeRequestAmId(messageType), requestHeader, false)
 
     logDebug(s"Performing a ${messageType} request of size ${request.remaining()} " +
@@ -285,7 +284,7 @@ class UCXConnection(peerExecutorId: Long, val ucx: UCX) extends Logging {
   }
 }
 
-object UCXConnection extends Logging {
+object UCXConnection {
   /**
    * 1) client gets upper 28 bits
    * 2) then comes the type, which gets 4 bits
@@ -389,8 +388,8 @@ object UCXConnection extends Logging {
     val rkeys = (0 until numRkeys).map { _ =>
       val rkeySize = buff.getInt
       val rkeySlice = buff.slice()
-      rkeySlice.limit(rkeySize)
-      buff.position(buff.position() + rkeySize)
+      rkeySlice.asInstanceOf[Buffer].limit(rkeySize)
+      buff.asInstanceOf[Buffer].position(buff.position() + rkeySize)
       rkeySlice
     }
     (remoteExecutorId, rkeys)
@@ -419,7 +418,7 @@ object UCXConnection extends Logging {
       hsBuff.putInt(rkey.capacity)
       hsBuff.put(rkey)
     }
-    hsBuff.flip()
+    hsBuff.asInstanceOf[Buffer].flip()
     hsBuff
   }
 }
diff --git a/shuffle-plugin/src/main/scala/com/nvidia/spark/rapids/shuffle/ucx/UCXShuffleTransport.scala b/shuffle-plugin/src/main/scala/com/nvidia/spark/rapids/shuffle/ucx/UCXShuffleTransport.scala
index 3a71fd769e7..6406fa44aaf 100644
--- a/shuffle-plugin/src/main/scala/com/nvidia/spark/rapids/shuffle/ucx/UCXShuffleTransport.scala
+++ b/shuffle-plugin/src/main/scala/com/nvidia/spark/rapids/shuffle/ucx/UCXShuffleTransport.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2020-2024, NVIDIA CORPORATION.
+ * Copyright (c) 2020-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -180,10 +180,10 @@ class UCXShuffleTransport(shuffleServerId: BlockManagerId, rapidsConf: RapidsCon
       val hostBuffer = tryAcquireBounceBuffers(hostSendBuffMgr, numBuffs)
       if (hostBuffer.nonEmpty) {
         deviceBuffer.zip(hostBuffer).map { case (d, h) =>
-          SendBounceBuffers(d, Some(h))
+          new SendBounceBuffers(d, Some(h))
         }
       } else {
-        deviceBuffer.map(d => SendBounceBuffers(d, None))
+        deviceBuffer.map(d => new SendBounceBuffers(d, None))
       }
     } else {
       Seq.empty
@@ -377,8 +377,8 @@ class UCXShuffleTransport(shuffleServerId: BlockManagerId, rapidsConf: RapidsCon
     }
   }
 
-  private case class ClientAndBufferReceiveState(client: RapidsShuffleClient,
-                                                 brs: BufferReceiveState)
+  private class ClientAndBufferReceiveState(val client: RapidsShuffleClient,
+                                                 val brs: BufferReceiveState)
   private val pendingBrs = new ConcurrentHashMap[Long, ClientAndBufferReceiveState]()
 
   def handleBufferReceive(size: Long, header: Long,
@@ -498,7 +498,7 @@ class UCXShuffleTransport(shuffleServerId: BlockManagerId, rapidsConf: RapidsCon
                 perClientRequests.bounceBuffer,
                 perClientRequests.transferRequests.toSeq,
                 () => bufferReceiveStateComplete(brsId))
-              pendingBrs.put(brs.id, ClientAndBufferReceiveState(client, brs))
+              pendingBrs.put(brs.id, new ClientAndBufferReceiveState(client, brs))
               client.issueBufferReceives(brs)
             }
           } else if (!hasBounceBuffers) {
diff --git a/shuffle-plugin/src/main/scala/com/nvidia/spark/rapids/shuffle/ucx/UCXTransaction.scala b/shuffle-plugin/src/main/scala/com/nvidia/spark/rapids/shuffle/ucx/UCXTransaction.scala
index db7cee1a87e..24feebcef16 100644
--- a/shuffle-plugin/src/main/scala/com/nvidia/spark/rapids/shuffle/ucx/UCXTransaction.scala
+++ b/shuffle-plugin/src/main/scala/com/nvidia/spark/rapids/shuffle/ucx/UCXTransaction.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2020-2021, NVIDIA CORPORATION.
+ * Copyright (c) 2020-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -280,7 +280,7 @@ private[ucx] class UCXTransaction(conn: UCXConnection, val txId: Long)
     val diff: Double = (end - start)/1000000.0D
     val sendThroughput: Double = (sendSize.get()/1024.0D/1024.0D/1024.0D) / (diff / 1000.0D)
     val recvThroughput: Double = (receiveSize.get()/1024.0D/1024.0D/1024.0D) / (diff / 1000.0D)
-    TransactionStats(diff, sendSize.get(), receiveSize.get(), sendThroughput, recvThroughput)
+    new TransactionStats(diff, sendSize.get(), receiveSize.get(), sendThroughput, recvThroughput)
   }
 
   var callbackCalled: Boolean = false
diff --git a/sql-plugin/src/main/java/com/nvidia/spark/rapids/HashedPriorityQueue.java b/sql-plugin-api/src/main/java/com/nvidia/spark/rapids/HashedPriorityQueue.java
similarity index 100%
rename from sql-plugin/src/main/java/com/nvidia/spark/rapids/HashedPriorityQueue.java
rename to sql-plugin-api/src/main/java/com/nvidia/spark/rapids/HashedPriorityQueue.java
diff --git a/sql-plugin-api/src/main/java/com/nvidia/spark/rapids/ThreadFactoryBuilder.java b/sql-plugin-api/src/main/java/com/nvidia/spark/rapids/ThreadFactoryBuilder.java
new file mode 100644
index 00000000000..19cf340c167
--- /dev/null
+++ b/sql-plugin-api/src/main/java/com/nvidia/spark/rapids/ThreadFactoryBuilder.java
@@ -0,0 +1,89 @@
+/*
+ * Copyright (c) 2022-2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.nvidia.spark.rapids;
+
+import java.util.concurrent.Executors;
+import java.util.concurrent.ThreadFactory;
+import java.util.concurrent.atomic.AtomicLong;
+
+/**
+ * This is similar to Guava ThreadFactoryBuilder. Avoid using Guava as it is a messy dependency
+ * in practice.
+ *
+ * <p>{@link #build()} snapshots the builder's settings, so a factory it returns is not affected
+ * by setter calls made on this builder afterwards.
+ */
+public class ThreadFactoryBuilder {
+  private String nameFormat;
+  private Boolean daemon;
+
+  /**
+   * Sets the naming pattern for created threads.
+   *
+   * @param nameFormat a {@link String#format(String, Object...)} pattern that is given the
+   *     zero-based index of the thread within the built factory as its single argument
+   * @return this builder
+   * @throws java.util.IllegalFormatException if the pattern cannot format a number; it is
+   *     validated here so a bad pattern fails at configuration time, not at thread creation
+   */
+  public ThreadFactoryBuilder setNameFormat(String nameFormat) {
+    String.format(nameFormat, 0);
+    this.nameFormat = nameFormat;
+    return this;
+  }
+
+  /**
+   * Sets the daemon status applied to every created thread.
+   *
+   * @param daemon value passed to {@link Thread#setDaemon(boolean)}
+   * @return this builder
+   */
+  public ThreadFactoryBuilder setDaemon(boolean daemon) {
+    this.daemon = daemon;
+    return this;
+  }
+
+  /**
+   * Builds a factory that delegates to {@link Executors#defaultThreadFactory()} and then
+   * applies whichever of the name format and daemon status were set.
+   *
+   * @return a new thread factory with its own thread counter
+   */
+  public ThreadFactory build() {
+    // Capture the configuration now. Reading the builder's fields lazily would let a later
+    // setNameFormat() call reach a factory whose counter was never allocated (NPE), and
+    // would let setDaemon() silently change factories that are already in use.
+    final String format = nameFormat;
+    final Boolean daemonSetting = daemon;
+    final AtomicLong count = format == null ? null : new AtomicLong(0);
+    return new ThreadFactory() {
+      private final ThreadFactory defaultThreadFactory = Executors.defaultThreadFactory();
+
+      @Override
+      public Thread newThread(Runnable runnable) {
+        Thread thread = defaultThreadFactory.newThread(runnable);
+        if (format != null) {
+          thread.setName(String.format(format, count.getAndIncrement()));
+        }
+        if (daemonSetting != null) {
+          thread.setDaemon(daemonSetting);
+        }
+        return thread;
+      }
+    };
+  }
+}
diff --git a/sql-plugin-api/src/main/scala/com/nvidia/spark/rapids/ShimCommandRules.scala b/sql-plugin-api/src/main/scala/com/nvidia/spark/rapids/ShimCommandRules.scala
new file mode 100644
index 00000000000..f402b69d749
--- /dev/null
+++ b/sql-plugin-api/src/main/scala/com/nvidia/spark/rapids/ShimCommandRules.scala
@@ -0,0 +1,73 @@
+/*
+ * Copyright (c) 2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.nvidia.spark.rapids
+
+import scala.reflect.ClassTag
+
+import org.apache.spark.sql.execution.SparkPlan
+import org.apache.spark.sql.execution.command.{DataWritingCommand, RunnableCommand}
+
+/**
+ * Describes a rule for a [[SparkPlan]] subtype by a description string and the
+ * [[scala.reflect.ClassTag]] of that subtype. Instances are created through the companion
+ * object only; the constructor is private.
+ */
+final class ShimExecRule[INPUT <: SparkPlan] private (
+    val desc: String,
+    val tag: ClassTag[INPUT])
+
+object ShimExecRule {
+  /** Creates a rule for `INPUT`, rejecting a null `desc` with an `IllegalArgumentException`. */
+  def apply[INPUT <: SparkPlan](desc: String)(
+      implicit tag: ClassTag[INPUT]): ShimExecRule[INPUT] = {
+    require(desc != null)
+    new ShimExecRule(desc, tag)
+  }
+}
+
+/**
+ * Describes a rule for a [[DataWritingCommand]] subtype by a description string and the
+ * [[scala.reflect.ClassTag]] of that subtype. Instances are created through the companion
+ * object only; the constructor is private.
+ */
+final class ShimDataWritingCommandRule[INPUT <: DataWritingCommand] private (
+    val desc: String,
+    val tag: ClassTag[INPUT])
+
+object ShimDataWritingCommandRule {
+  /** Creates a rule for `INPUT`, rejecting a null `desc` with an `IllegalArgumentException`. */
+  def apply[INPUT <: DataWritingCommand](desc: String)(
+      implicit tag: ClassTag[INPUT]): ShimDataWritingCommandRule[INPUT] = {
+    require(desc != null)
+    new ShimDataWritingCommandRule(desc, tag)
+  }
+}
+
+/**
+ * Describes a rule for a [[RunnableCommand]] subtype by a description string and the
+ * [[scala.reflect.ClassTag]] of that subtype. Instances are created through the companion
+ * object only; the constructor is private.
+ */
+final class ShimRunnableCommandRule[INPUT <: RunnableCommand] private (
+    val desc: String,
+    val tag: ClassTag[INPUT])
+
+object ShimRunnableCommandRule {
+  /** Creates a rule for `INPUT`, rejecting a null `desc` with an `IllegalArgumentException`. */
+  def apply[INPUT <: RunnableCommand](desc: String)(
+      implicit tag: ClassTag[INPUT]): ShimRunnableCommandRule[INPUT] = {
+    require(desc != null)
+    new ShimRunnableCommandRule(desc, tag)
+  }
+}
diff --git a/sql-plugin-columnar/pom.xml b/sql-plugin-columnar/pom.xml
new file mode 100644
index 00000000000..c1bed4d032d
--- /dev/null
+++ b/sql-plugin-columnar/pom.xml
@@ -0,0 +1,124 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!--
+  Copyright (c) 2026, NVIDIA CORPORATION.
+
+  Licensed under the Apache License, Version 2.0 (the "License");
+  you may not use this file except in compliance with the License.
+  You may obtain a copy of the License at
+
+     http://www.apache.org/licenses/LICENSE-2.0
+
+  Unless required by applicable law or agreed to in writing, software
+  distributed under the License is distributed on an "AS IS" BASIS,
+  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+  See the License for the specific language governing permissions and
+  limitations under the License.
+-->
+<project xmlns="http://maven.apache.org/POM/4.0.0"
+         xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
+         xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/xsd/maven-4.0.0.xsd">
+    <modelVersion>4.0.0</modelVersion>
+
+    <parent>
+        <groupId>com.nvidia</groupId>
+        <artifactId>rapids-4-spark-shim-deps-parent_2.12</artifactId>
+        <version>26.08.0-SNAPSHOT</version>
+        <relativePath>../shim-deps/pom.xml</relativePath>
+    </parent>
+
+    <artifactId>rapids-4-spark-sql-plugin-columnar_2.12</artifactId>
+    <description>Java-only columnar runtime plumbing for the RAPIDS SQL plugin</description>
+    <version>26.08.0-SNAPSHOT</version>
+
+    <properties>
+        <rapids.module>sql-plugin-columnar</rapids.module>
+        <rapids.compressed.artifact>false</rapids.compressed.artifact>
+        <rapids.default.jar.excludePattern>**/*</rapids.default.jar.excludePattern>
+        <rapids.shim.jar.phase>package</rapids.shim.jar.phase>
+        <rapids.shimplify.skip>true</rapids.shimplify.skip>
+    </properties>
+
+    <dependencies>
+        <dependency>
+            <groupId>com.nvidia</groupId>
+            <artifactId>spark-rapids-jni</artifactId>
+            <classifier>${jni.classifier}</classifier>
+        </dependency>
+        <dependency>
+            <groupId>com.nvidia</groupId>
+            <artifactId>rapids-4-spark-sql-plugin-format_${scala.binary.version}</artifactId>
+            <version>${project.version}</version>
+            <classifier>${spark.version.classifier}</classifier>
+        </dependency>
+        <dependency>
+            <groupId>org.apache.spark</groupId>
+            <artifactId>spark-sql_${scala.binary.version}</artifactId>
+            <version>${spark.version}</version>
+            <scope>provided</scope>
+        </dependency>
+    </dependencies>
+
+    <build>
+        <plugins>
+            <plugin> <!-- Runs javac for main sources in the compile phase and for test sources in test-compile -->
+                <groupId>org.apache.maven.plugins</groupId>
+                <artifactId>maven-compiler-plugin</artifactId>
+                <executions>
+                    <execution>
+                        <id>default-compile</id>
+                        <phase>compile</phase>
+                        <goals>
+                            <goal>compile</goal>
+                        </goals>
+                    </execution>
+                    <execution>
+                        <id>default-testCompile</id>
+                        <phase>test-compile</phase>
+                        <goals>
+                            <goal>testCompile</goal>
+                        </goals>
+                    </execution>
+                </executions>
+                <configuration>
+                    <release>${java.major.version}</release>
+                    <compilerArgs>
+                        <arg>-Xlint:all,-serial,-path,-try,-processing</arg> <!-- every javac lint category except serial, path, try and processing -->
+                    </compilerArgs>
+                </configuration>
+            </plugin>
+            <plugin> <!-- Every execution listed here is set to phase "none", so none of them runs in this module -->
+                <groupId>net.alchim31.maven</groupId>
+                <artifactId>scala-maven-plugin</artifactId>
+                <executions> <!-- NOTE(review): these ids are presumably inherited from the parent POM; confirm they match it -->
+                    <execution>
+                        <id>eclipse-add-source</id>
+                        <phase>none</phase>
+                    </execution>
+                    <execution>
+                        <id>scala-compile-first</id>
+                        <phase>none</phase>
+                    </execution>
+                    <execution>
+                        <id>scala-test-compile-first</id>
+                        <phase>none</phase>
+                    </execution>
+                    <execution>
+                        <id>attach-scaladocs</id>
+                        <phase>none</phase>
+                    </execution>
+                </executions>
+            </plugin>
+            <plugin>
+                <groupId>org.apache.rat</groupId>
+                <artifactId>apache-rat-plugin</artifactId>
+            </plugin>
+            <plugin> <!-- Surefire test execution is switched off for this module -->
+                <groupId>org.apache.maven.plugins</groupId>
+                <artifactId>maven-surefire-plugin</artifactId>
+                <configuration>
+                    <skipTests>true</skipTests> <!-- tests are skipped at run time; test sources are still compiled by the compiler plugin -->
+                </configuration>
+            </plugin>
+        </plugins>
+    </build>
+</project>
diff --git a/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/AbstractHostByteBufferIterator.java b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/AbstractHostByteBufferIterator.java
new file mode 100644
index 00000000000..99a03734d90
--- /dev/null
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/AbstractHostByteBufferIterator.java
@@ -0,0 +1,64 @@
+/*
+ * Copyright (c) 2023-2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.nvidia.spark.rapids;
+
+import java.nio.ByteBuffer;
+
+import scala.collection.AbstractIterator;
+
+/**
+ * Iterator that walks a range of {@link #totalLength()} bytes and hands it out as a sequence
+ * of {@link ByteBuffer} chunks.
+ *
+ * <p>Every {@link #next()} call requests the chunk that starts where the previous one ended. A
+ * chunk is at most {@link #limit()} long and never extends past {@link #totalLength()}.
+ */
+public abstract class AbstractHostByteBufferIterator extends AbstractIterator<ByteBuffer> {
+  /** Offset at which the next chunk begins. */
+  private long cursor = 0L;
+
+  /** Length of the whole range; iteration stops once the cursor reaches it. */
+  public abstract long totalLength();
+
+  /** Largest length a single chunk may have; {@link Integer#MAX_VALUE} unless overridden. */
+  public long limit() {
+    return Integer.MAX_VALUE;
+  }
+
+  /** Supplies the buffer covering {@code length} bytes starting at {@code offset}. */
+  public abstract ByteBuffer getByteBuffer(long offset, long length);
+
+  /** Reports whether the cursor is still short of {@link #totalLength()}. */
+  @Override
+  public boolean hasNext() {
+    return totalLength() > cursor;
+  }
+
+  /**
+   * Returns the next chunk and moves the cursor past it.
+   *
+   * <p>This method does not test {@link #hasNext()} itself before requesting the chunk.
+   */
+  @Override
+  public ByteBuffer next() {
+    final long chunkStart = cursor;
+    final long remaining = totalLength() - chunkStart;
+    final long chunkLength = Math.min(remaining, limit());
+    cursor = chunkStart + chunkLength;
+    return getByteBuffer(chunkStart, chunkLength);
+  }
+}
diff --git a/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/AggregateModeInfo.java b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/AggregateModeInfo.java
new file mode 100644
index 00000000000..80834a02f5c
--- /dev/null
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/AggregateModeInfo.java
@@ -0,0 +1,129 @@
+/*
+ * Copyright (c) 2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.nvidia.spark.rapids;
+
+import java.io.Serializable;
+import java.util.Objects;
+
+import org.apache.spark.sql.catalyst.expressions.aggregate.AggregateMode;
+import org.apache.spark.sql.catalyst.expressions.aggregate.Complete$;
+import org.apache.spark.sql.catalyst.expressions.aggregate.Final$;
+import org.apache.spark.sql.catalyst.expressions.aggregate.Partial$;
+import org.apache.spark.sql.catalyst.expressions.aggregate.PartialMerge$;
+
+import scala.collection.Seq;
+
+/**
+ * Immutable, serializable summary of the aggregation modes being used: the sequence of unique
+ * modes together with one flag per mode kind (Partial, PartialMerge, Final and Complete).
+ */
+public class AggregateModeInfo implements Serializable {
+  private static final long serialVersionUID = 1L;
+
+  private final Seq<AggregateMode> uniqueModes;
+  private final boolean hasPartialMode;
+  private final boolean hasPartialMergeMode;
+  private final boolean hasFinalMode;
+  private final boolean hasCompleteMode;
+
+  /**
+   * Stores the arguments exactly as given; the flags are not checked against
+   * {@code uniqueModes}. {@link #from(Seq)} derives the flags from the sequence instead.
+   */
+  public AggregateModeInfo(
+      Seq<AggregateMode> uniqueModes,
+      boolean hasPartialMode,
+      boolean hasPartialMergeMode,
+      boolean hasFinalMode,
+      boolean hasCompleteMode) {
+    this.uniqueModes = uniqueModes;
+    this.hasPartialMode = hasPartialMode;
+    this.hasPartialMergeMode = hasPartialMergeMode;
+    this.hasFinalMode = hasFinalMode;
+    this.hasCompleteMode = hasCompleteMode;
+  }
+
+  /** Creates an instance whose flags come from membership tests on {@code uniqueModes}. */
+  public static AggregateModeInfo from(Seq<AggregateMode> uniqueModes) {
+    final boolean partial = uniqueModes.contains(Partial$.MODULE$);
+    final boolean partialMerge = uniqueModes.contains(PartialMerge$.MODULE$);
+    final boolean finalMode = uniqueModes.contains(Final$.MODULE$);
+    final boolean complete = uniqueModes.contains(Complete$.MODULE$);
+    return new AggregateModeInfo(uniqueModes, partial, partialMerge, finalMode, complete);
+  }
+
+  /** The sequence of modes this instance was built with. */
+  public Seq<AggregateMode> uniqueModes() {
+    return uniqueModes;
+  }
+
+  /** Flag recorded for the Partial mode. */
+  public boolean hasPartialMode() {
+    return hasPartialMode;
+  }
+
+  /** Flag recorded for the PartialMerge mode. */
+  public boolean hasPartialMergeMode() {
+    return hasPartialMergeMode;
+  }
+
+  /** Flag recorded for the Final mode. */
+  public boolean hasFinalMode() {
+    return hasFinalMode;
+  }
+
+  /** Flag recorded for the Complete mode. */
+  public boolean hasCompleteMode() {
+    return hasCompleteMode;
+  }
+
+  /** Two instances are equal when all four flags and the mode sequences are equal. */
+  @Override
+  public boolean equals(Object other) {
+    if (other == this) {
+      return true;
+    }
+    if (other instanceof AggregateModeInfo) {
+      final AggregateModeInfo rhs = (AggregateModeInfo) other;
+      return hasPartialMode == rhs.hasPartialMode
+          && hasPartialMergeMode == rhs.hasPartialMergeMode
+          && hasFinalMode == rhs.hasFinalMode
+          && hasCompleteMode == rhs.hasCompleteMode
+          && Objects.equals(uniqueModes, rhs.uniqueModes);
+    }
+    return false;
+  }
+
+  /** Hash over the same five components that {@link #equals(Object)} compares. */
+  @Override
+  public int hashCode() {
+    return Objects.hash(
+        uniqueModes, hasPartialMode, hasPartialMergeMode, hasFinalMode, hasCompleteMode);
+  }
+
+  /** Renders as {@code AggregateModeInfo(modes,partial,partialMerge,final,complete)}. */
+  @Override
+  public String toString() {
+    return new StringBuilder("AggregateModeInfo(")
+        .append(uniqueModes).append(',')
+        .append(hasPartialMode).append(',')
+        .append(hasPartialMergeMode).append(',')
+        .append(hasFinalMode).append(',')
+        .append(hasCompleteMode).append(')')
+        .toString();
+  }
+}
diff --git a/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/ArrayIndexUtils.java b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/ArrayIndexUtils.java
new file mode 100644
index 00000000000..cab1ecfced3
--- /dev/null
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/ArrayIndexUtils.java
@@ -0,0 +1,75 @@
+/*
+ * Copyright (c) 2022-2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.nvidia.spark.rapids;
+
+import ai.rapids.cudf.ColumnVector;
+import ai.rapids.cudf.ColumnView;
+import ai.rapids.cudf.HostColumnVector;
+import ai.rapids.cudf.Table;
+
+/** Static helper that reads the first mask-selected (index, numElements) pair from columns. */
+public final class ArrayIndexUtils {
+  private ArrayIndexUtils() {}
+
+  /** Immutable pair of an index and a number of elements. */
+  public static final class IndexAndNumElement {
+    private final int index;
+    private final int numElements;
+
+    IndexAndNumElement(int index, int numElements) {
+      this.index = index;
+      this.numElements = numElements;
+    }
+
+    public int getIndex() {
+      return index;
+    }
+
+    public int getNumElements() {
+      return numElements;
+    }
+  }
+
+  /**
+   * Finds the first row for which {@code mask} is true and returns the values that
+   * {@code indices} and {@code numElements} hold in that row. Rows where {@code mask} is null
+   * are skipped, and the two returned values are expected to be valid (non-null).
+   *
+   * <p>The caller must pass int columns for {@code indices} and {@code numElements} and a
+   * boolean column for {@code mask}, all with the same row count; behavior is undefined
+   * otherwise. Only the existence of a selected row and the non-nullness of the two values
+   * are checked, and only through {@code assert} statements.
+   */
+  public static IndexAndNumElement firstIndexAndNumElementUnchecked(
+      ColumnView mask, ColumnVector indices, ColumnVector numElements) {
+    try (Table paired = new Table(indices, numElements);
+         Table selected = paired.filter(mask)) {
+      assert selected.getRowCount() > 0;
+      final int firstIndex = firstIntOf(selected.getColumn(0));
+      final int firstNumElements = firstIntOf(selected.getColumn(1));
+      return new IndexAndNumElement(firstIndex, firstNumElements);
+    }
+  }
+
+  /** Copies {@code column} to the host and returns row 0 as an int (asserted non-null). */
+  private static int firstIntOf(ColumnVector column) {
+    try (HostColumnVector onHost = column.copyToHost()) {
+      assert !onHost.isNull(0);
+      return onHost.getInt(0);
+    }
+  }
+}
diff --git a/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/AutoCloseableTargetSize.java b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/AutoCloseableTargetSize.java
new file mode 100644
index 00000000000..db294308c4f
--- /dev/null
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/AutoCloseableTargetSize.java
@@ -0,0 +1,93 @@
+/*
+ * Copyright (c) 2024-2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.nvidia.spark.rapids;
+
+import java.io.Serializable;
+import java.util.Objects;
+
+/**
+ * Immutable, serializable holder of three sizes (target, minimum and data) that can be used
+ * in a try-with-resources statement. {@link #close()} does nothing.
+ */
+public class AutoCloseableTargetSize implements AutoCloseable, Serializable {
+  private static final long serialVersionUID = 1L;
+
+  public final long targetSize;
+  public final long minSize;
+  public final long dataSize;
+
+  /** Same as the three-argument constructor with {@code dataSize} set to 0. */
+  public AutoCloseableTargetSize(long targetSize, long minSize) {
+    this(targetSize, minSize, 0L);
+  }
+
+  /** Records the three sizes without validating them. */
+  public AutoCloseableTargetSize(long targetSize, long minSize, long dataSize) {
+    this.targetSize = targetSize;
+    this.minSize = minSize;
+    this.dataSize = dataSize;
+  }
+
+  /** Accessor for {@link #targetSize}. */
+  public long targetSize() {
+    return targetSize;
+  }
+
+  /** Accessor for {@link #minSize}. */
+  public long minSize() {
+    return minSize;
+  }
+
+  /** Accessor for {@link #dataSize}. */
+  public long dataSize() {
+    return dataSize;
+  }
+
+  /** No-op. */
+  @Override
+  public void close() {
+  }
+
+  /** Equal when {@code other} is an instance of this class holding the same three sizes. */
+  @Override
+  public boolean equals(Object other) {
+    if (other == this) {
+      return true;
+    }
+    if (other instanceof AutoCloseableTargetSize) {
+      final AutoCloseableTargetSize rhs = (AutoCloseableTargetSize) other;
+      return rhs.targetSize == targetSize
+          && rhs.minSize == minSize
+          && rhs.dataSize == dataSize;
+    }
+    return false;
+  }
+
+  /** Hash over the three sizes. */
+  @Override
+  public int hashCode() {
+    return Objects.hash(targetSize, minSize, dataSize);
+  }
+
+  /** Renders as {@code AutoCloseableTargetSize(targetSize,minSize,dataSize)}. */
+  @Override
+  public String toString() {
+    final StringBuilder text = new StringBuilder("AutoCloseableTargetSize(");
+    text.append(targetSize).append(',').append(minSize).append(',').append(dataSize);
+    return text.append(')').toString();
+  }
+}
diff --git a/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/BlockInfo.java b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/BlockInfo.java
new file mode 100644
index 00000000000..300d8026f18
--- /dev/null
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/BlockInfo.java
@@ -0,0 +1,89 @@
+/*
+ * Copyright (c) 2022-2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.nvidia.spark.rapids;
+
+import java.io.Serializable;
+import java.util.Objects;
+
+/** Avro block metadata: an immutable record of four {@code long} values. */
+public final class BlockInfo implements Serializable {
+  private static final long serialVersionUID = 1L;
+
+  private final long blockStart;
+  private final long blockSize;
+  private final long dataSize;
+  private final long count;
+
+  /** Records the four values without validating them. */
+  public BlockInfo(long blockStart, long blockSize, long dataSize, long count) {
+    this.blockStart = blockStart;
+    this.blockSize = blockSize;
+    this.dataSize = dataSize;
+    this.count = count;
+  }
+
+  /** Value passed as {@code blockStart} at construction. */
+  public long blockStart() {
+    return blockStart;
+  }
+
+  /** Value passed as {@code blockSize} at construction. */
+  public long blockSize() {
+    return blockSize;
+  }
+
+  /** Value passed as {@code dataSize} at construction. */
+  public long dataSize() {
+    return dataSize;
+  }
+
+  /** Value passed as {@code count} at construction. */
+  public long count() {
+    return count;
+  }
+
+  /** Equal when {@code obj} is a {@code BlockInfo} holding the same four values. */
+  @Override
+  public boolean equals(Object obj) {
+    if (obj == this) {
+      return true;
+    }
+    if (obj instanceof BlockInfo) {
+      final BlockInfo rhs = (BlockInfo) obj;
+      return rhs.blockStart == blockStart
+          && rhs.blockSize == blockSize
+          && rhs.dataSize == dataSize
+          && rhs.count == count;
+    }
+    return false;
+  }
+
+  /** Hash over the four values. */
+  @Override
+  public int hashCode() {
+    return Objects.hash(blockStart, blockSize, dataSize, count);
+  }
+
+  /** Renders as {@code BlockInfo(blockStart,blockSize,dataSize,count)}. */
+  @Override
+  public String toString() {
+    final StringBuilder text = new StringBuilder("BlockInfo(");
+    text.append(blockStart).append(',').append(blockSize).append(',');
+    text.append(dataSize).append(',').append(count);
+    return text.append(')').toString();
+  }
+}
diff --git a/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/BoolUtils.java b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/BoolUtils.java
new file mode 100644
index 00000000000..d02a83c77b1
--- /dev/null
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/BoolUtils.java
@@ -0,0 +1,77 @@
+/*
+ * Copyright (c) 2022-2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.nvidia.spark.rapids;
+
+import ai.rapids.cudf.ColumnVector;
+import ai.rapids.cudf.DType;
+import ai.rapids.cudf.Scalar;
+
+/** Reductions over boolean cudf columns that ignore null rows. */
+public final class BoolUtils {
+  private BoolUtils() {}
+
+  /**
+   * Whether all the valid rows in {@code col} are true. Null rows are skipped, so an empty
+   * column and a column that holds only nulls both yield true.
+   *
+   * @param col column to inspect; its type must be {@link DType#BOOL8}
+   * @return true unless some valid row is false
+   * @throws AssertionError if {@code col} is not a BOOL8 column
+   */
+  public static boolean isAllValidTrue(ColumnVector col) {
+    requireBool(col);
+    if (col.getRowCount() == col.getNullCount()) {
+      // No valid row at all. This also covers the empty column, where both counts are 0.
+      return true;
+    }
+    try (Scalar allTrue = col.all()) {
+      // At least one valid row exists here, so the result scalar must be valid.
+      return allTrue.getBoolean();
+    }
+  }
+
+  /**
+   * Whether there is any valid row in {@code col} and it is true. Null rows are skipped, so
+   * an empty column and a column that holds only nulls both yield false.
+   *
+   * @param col column to inspect; its type must be {@link DType#BOOL8}
+   * @return true when some valid row is true
+   * @throws AssertionError if {@code col} is not a BOOL8 column
+   */
+  public static boolean isAnyValidTrue(ColumnVector col) {
+    requireBool(col);
+    if (col.getRowCount() == col.getNullCount()) {
+      // No valid row at all. This also covers the empty column, where both counts are 0.
+      return false;
+    }
+    try (Scalar anyTrue = col.any()) {
+      // At least one valid row exists here, so the result scalar must be valid.
+      return anyTrue.getBoolean();
+    }
+  }
+
+  /**
+   * Rejects a column whose type is not {@link DType#BOOL8}. The error is thrown explicitly
+   * rather than through an {@code assert} statement, because {@code assert} statements are
+   * skipped unless the JVM runs with assertions enabled.
+   */
+  private static void requireBool(ColumnVector col) {
+    if (DType.BOOL8 != col.getType()) {
+      throw new AssertionError("input column type is not bool");
+    }
+  }
+}
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/ColumnViewUtils.scala b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/ColumnViewUtils.java
similarity index 56%
rename from sql-plugin/src/main/scala/com/nvidia/spark/rapids/ColumnViewUtils.scala
rename to sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/ColumnViewUtils.java
index 8bea6481220..84e643d3c1f 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/ColumnViewUtils.scala
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/ColumnViewUtils.java
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2025, NVIDIA CORPORATION.
+ * Copyright (c) 2025-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -13,22 +13,25 @@
  * See the License for the specific language governing permissions and
  * limitations under the License.
  */
-package com.nvidia.spark.rapids
 
-import ai.rapids.cudf.ColumnView
-import com.nvidia.spark.rapids.Arm.withResource
+package com.nvidia.spark.rapids;
+
+import ai.rapids.cudf.ColumnView;
+import ai.rapids.cudf.Scalar;
+
+public final class ColumnViewUtils {
+  private ColumnViewUtils() {}
 
-object ColumnViewUtils {
   /**
-   * Get the `toString` on the scalar element at the specified row index in a column view.
+   * Returns {@code toString} of the scalar at {@code rowIndex}, or "null" when it is not valid.
    * E.g., returns: Scalar{type=INT32 value=-1250858453} (ID: 143 7149580cdd60)
    */
-  def getElementStringFromColumnView(cv: ColumnView, rowIndex: Int): String = {
-    withResource(cv.getScalarElement(rowIndex)) { scalar =>
-      if (scalar.isValid) {
-        scalar.toString
+  public static String getElementStringFromColumnView(ColumnView cv, int rowIndex) {
+    try (Scalar scalar = cv.getScalarElement(rowIndex)) {
+      if (scalar.isValid()) {
+        return scalar.toString();
       } else {
-        "null"
+        return "null";
       }
     }
   }
diff --git a/sql-plugin/src/main/java/com/nvidia/spark/rapids/ColumnarCopyHelper.java b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/ColumnarCopyHelper.java
similarity index 100%
rename from sql-plugin/src/main/java/com/nvidia/spark/rapids/ColumnarCopyHelper.java
rename to sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/ColumnarCopyHelper.java
diff --git a/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/CombineConf.java b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/CombineConf.java
new file mode 100644
index 00000000000..1bb19bc9261
--- /dev/null
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/CombineConf.java
@@ -0,0 +1,73 @@
+/*
+ * Copyright (c) 2024-2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.nvidia.spark.rapids;
+
+import java.io.Serializable;
+import java.util.Objects;
+
+/** Immutable, serializable pair of a combine threshold size and a combine wait time. */
+public class CombineConf implements Serializable {
+  private static final long serialVersionUID = 1L;
+
+  private final long combineThresholdSize;
+  private final int combineWaitTime;
+
+  /** Records both settings without validating them. */
+  public CombineConf(long combineThresholdSize, int combineWaitTime) {
+    this.combineThresholdSize = combineThresholdSize;
+    this.combineWaitTime = combineWaitTime;
+  }
+
+  /** Value passed as {@code combineThresholdSize} at construction. */
+  public long combineThresholdSize() {
+    return combineThresholdSize;
+  }
+
+  /** Value passed as {@code combineWaitTime} at construction. */
+  public int combineWaitTime() {
+    return combineWaitTime;
+  }
+
+  /** Equal when {@code other} is a {@code CombineConf} holding the same two settings. */
+  @Override
+  public boolean equals(Object other) {
+    if (other == this) {
+      return true;
+    }
+    if (other instanceof CombineConf) {
+      final CombineConf rhs = (CombineConf) other;
+      return rhs.combineThresholdSize == combineThresholdSize
+          && rhs.combineWaitTime == combineWaitTime;
+    }
+    return false;
+  }
+
+  /** Hash over the two settings. */
+  @Override
+  public int hashCode() {
+    return Objects.hash(combineThresholdSize, combineWaitTime);
+  }
+
+  /** Renders as {@code CombineConf(combineThresholdSize,combineWaitTime)}. */
+  @Override
+  public String toString() {
+    return new StringBuilder("CombineConf(")
+        .append(combineThresholdSize).append(',')
+        .append(combineWaitTime).append(')')
+        .toString();
+  }
+}
diff --git a/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/CompressedTable.java b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/CompressedTable.java
new file mode 100644
index 00000000000..06c410d0c8c
--- /dev/null
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/CompressedTable.java
@@ -0,0 +1,91 @@
+/*
+ * Copyright (c) 2020-2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.nvidia.spark.rapids;
+
+import java.util.Objects;
+
+import ai.rapids.cudf.DeviceMemoryBuffer;
+import com.nvidia.spark.rapids.format.TableMeta;
+
+/**
+ * Compressed table descriptor: the compressed size, the table metadata and the device buffer.
+ * Closing the descriptor closes the buffer.
+ */
+public class CompressedTable implements AutoCloseable {
+  public final long compressedSize;
+  public final TableMeta meta;
+  public final DeviceMemoryBuffer buffer;
+
+  /** Stores the three values as given; {@code buffer} is closed by {@link #close()}. */
+  public CompressedTable(long compressedSize, TableMeta meta, DeviceMemoryBuffer buffer) {
+    this.compressedSize = compressedSize;
+    this.meta = meta;
+    this.buffer = buffer;
+  }
+
+  /** Accessor for {@link #compressedSize}. */
+  public long compressedSize() {
+    return compressedSize;
+  }
+
+  /** Accessor for {@link #meta}. */
+  public TableMeta meta() {
+    return meta;
+  }
+
+  /** Accessor for {@link #buffer}. */
+  public DeviceMemoryBuffer buffer() {
+    return buffer;
+  }
+
+  /** Closes {@link #buffer}. */
+  @Override
+  public void close() {
+    buffer.close();
+  }
+
+  /** Equal when the sizes match and both the metadata and the buffers are equal. */
+  @Override
+  public boolean equals(Object other) {
+    if (other == this) {
+      return true;
+    }
+    if (other instanceof CompressedTable) {
+      final CompressedTable rhs = (CompressedTable) other;
+      return compressedSize == rhs.compressedSize
+          && Objects.equals(meta, rhs.meta)
+          && Objects.equals(buffer, rhs.buffer);
+    }
+    return false;
+  }
+
+  /** Hash over the size, the metadata and the buffer. */
+  @Override
+  public int hashCode() {
+    return Objects.hash(compressedSize, meta, buffer);
+  }
+
+  /** Renders as {@code CompressedTable(compressedSize,meta,buffer)}. */
+  @Override
+  public String toString() {
+    return new StringBuilder("CompressedTable(")
+        .append(compressedSize).append(',')
+        .append(meta).append(',')
+        .append(buffer).append(')')
+        .toString();
+  }
+}
diff --git a/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/DecimalUtil.java b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/DecimalUtil.java
new file mode 100644
index 00000000000..5dc43a5678c
--- /dev/null
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/DecimalUtil.java
@@ -0,0 +1,116 @@
+/*
+ * Copyright (c) 2021-2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.nvidia.spark.rapids;
+
+import ai.rapids.cudf.ColumnVector;
+import ai.rapids.cudf.ColumnView;
+import ai.rapids.cudf.DType;
+import ai.rapids.cudf.DecimalUtils;
+
+import org.apache.spark.sql.types.BooleanType;
+import org.apache.spark.sql.types.ByteType;
+import org.apache.spark.sql.types.DataType;
+import org.apache.spark.sql.types.DataTypes;
+import org.apache.spark.sql.types.Decimal;
+import org.apache.spark.sql.types.DecimalType;
+import org.apache.spark.sql.types.IntegerType;
+import org.apache.spark.sql.types.LongType;
+import org.apache.spark.sql.types.ShortType;
+
+import scala.Option;
+
+/** Static helpers that bridge Spark {@link DecimalType} and cudf decimal {@link DType}. */
+public final class DecimalUtil {
+  private static final DecimalType BOOLEAN_DECIMAL = DataTypes.createDecimalType(1, 0);
+
+  private DecimalUtil() {}
+
+  /** Builds the cudf decimal type for the precision and scale of {@code dt}. */
+  public static DType createCudfDecimal(DecimalType dt) {
+    final int precision = dt.precision();
+    final int scale = dt.scale();
+    return DecimalUtils.createDecimalType(precision, scale);
+  }
+
+  /** Calls {@code DecimalUtils.outOfBounds} using the precision and scale of {@code to}. */
+  public static ColumnVector outOfBounds(ColumnView input, DecimalType to) {
+    final int precision = to.precision();
+    final int scale = to.scale();
+    return DecimalUtils.outOfBounds(input, precision, scale);
+  }
+
+  /**
+   * Return the size in bytes of the fixed-width data types. A {@link DecimalType} whose
+   * precision is at most {@code Decimal.MAX_INT_DIGITS()} is reported as 4 bytes; everything
+   * else reports {@code dt.defaultSize()}.
+   * WARNING: Do not use this method for variable-width data types.
+   */
+  public static int getDataTypeSize(DataType dt) {
+    final boolean fitsInInt =
+        dt instanceof DecimalType && ((DecimalType) dt).precision() <= Decimal.MAX_INT_DIGITS();
+    return fitsInInt ? 4 : dt.defaultSize();
+  }
+
+  /**
+   * Maps {@code t} to a decimal type when one is defined for it: a {@link DecimalType} maps to
+   * itself, byte/short/integer/long map to a scale-0 decimal with the precision cudf reports
+   * for the matching integer type, and boolean maps to decimal(1, 0). Any other type yields
+   * an empty {@link Option}.
+   */
+  public static Option<DecimalType> optionallyAsDecimalType(DataType t) {
+    if (t instanceof DecimalType) {
+      return Option.apply((DecimalType) t);
+    }
+    if (t instanceof ByteType) {
+      return decimalTypeFor(DType.INT8);
+    }
+    if (t instanceof ShortType) {
+      return decimalTypeFor(DType.INT16);
+    }
+    if (t instanceof IntegerType) {
+      return decimalTypeFor(DType.INT32);
+    }
+    if (t instanceof LongType) {
+      return decimalTypeFor(DType.INT64);
+    }
+    if (t instanceof BooleanType) {
+      return Option.apply(BOOLEAN_DECIMAL);
+    }
+    return Option.empty();
+  }
+
+  /**
+   * Like {@link #optionallyAsDecimalType(DataType)}, but fails when no decimal type is defined.
+   *
+   * @throws IllegalArgumentException if {@code t} has no decimal mapping
+   */
+  public static DecimalType asDecimalType(DataType t) {
+    final Option<DecimalType> mapped = optionallyAsDecimalType(t);
+    if (mapped.isEmpty()) {
+      final String message =
+          "Internal Error: type " + t + " cannot automatically be cast to a supported DecimalType";
+      throw new IllegalArgumentException(message);
+    }
+    return mapped.get();
+  }
+
+  /** Scale-0 decimal type whose precision is {@code dtype.getPrecisionForInt()}. */
+  private static Option<DecimalType> decimalTypeFor(DType dtype) {
+    final int precision = dtype.getPrecisionForInt();
+    return Option.apply(DataTypes.createDecimalType(precision, 0));
+  }
+}
diff --git a/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/DefaultThreadPoolConf.java b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/DefaultThreadPoolConf.java
new file mode 100644
index 00000000000..c42edeb8405
--- /dev/null
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/DefaultThreadPoolConf.java
@@ -0,0 +1,74 @@
+/*
+ * Copyright (c) 2024-2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.nvidia.spark.rapids;
+
+import java.util.Objects;
+
+/** {@link ThreadPoolConf} backed by two immutable fields supplied at construction. */
+public class DefaultThreadPoolConf implements ThreadPoolConf {
+  private static final long serialVersionUID = 1L;
+
+  private final int maxThreadNumber;
+  private final boolean stageLevelPool;
+
+  /** Records both settings without validating them. */
+  public DefaultThreadPoolConf(int maxThreadNumber, boolean stageLevelPool) {
+    this.maxThreadNumber = maxThreadNumber;
+    this.stageLevelPool = stageLevelPool;
+  }
+
+  /** Value passed as {@code maxThreadNumber} at construction. */
+  @Override
+  public int maxThreadNumber() {
+    return maxThreadNumber;
+  }
+
+  /** Value passed as {@code stageLevelPool} at construction. */
+  @Override
+  public boolean stageLevelPool() {
+    return stageLevelPool;
+  }
+
+  /** Equal when {@code other} is a {@code DefaultThreadPoolConf} with the same two settings. */
+  @Override
+  public boolean equals(Object other) {
+    if (other == this) {
+      return true;
+    }
+    if (other instanceof DefaultThreadPoolConf) {
+      final DefaultThreadPoolConf rhs = (DefaultThreadPoolConf) other;
+      return rhs.maxThreadNumber == maxThreadNumber
+          && rhs.stageLevelPool == stageLevelPool;
+    }
+    return false;
+  }
+
+  /** Hash over the two settings. */
+  @Override
+  public int hashCode() {
+    return Objects.hash(maxThreadNumber, stageLevelPool);
+  }
+
+  /** Renders as {@code DefaultThreadPoolConf(maxThreadNumber,stageLevelPool)}. */
+  @Override
+  public String toString() {
+    return new StringBuilder("DefaultThreadPoolConf(")
+        .append(maxThreadNumber).append(',')
+        .append(stageLevelPool).append(')')
+        .toString();
+  }
+}
diff --git a/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/DeviceBuffersUtils.java b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/DeviceBuffersUtils.java
new file mode 100644
index 00000000000..0e855219887
--- /dev/null
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/DeviceBuffersUtils.java
@@ -0,0 +1,98 @@
+/*
+ * Copyright (c) 2024-2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.nvidia.spark.rapids;
+
+import ai.rapids.cudf.BaseDeviceMemoryBuffer;
+import ai.rapids.cudf.DeviceMemoryBuffer;
+
+/** Static helpers that produce arrays of device buffers and clean up after a failure. */
+public final class DeviceBuffersUtils {
+  private DeviceBuffersUtils() {}
+
+  /**
+   * Increments the reference count of every buffer in {@code bufs} and returns them in a new
+   * array, in the same order. If anything is thrown part-way through, the buffers whose count
+   * was already incremented are closed before the error is rethrown.
+   */
+  public static BaseDeviceMemoryBuffer[] incRefCount(BaseDeviceMemoryBuffer[] bufs) {
+    final BaseDeviceMemoryBuffer[] retained = new BaseDeviceMemoryBuffer[bufs.length];
+    int acquired = 0;
+    try {
+      while (acquired < bufs.length) {
+        final BaseDeviceMemoryBuffer current = bufs[acquired];
+        current.incRefCount();
+        retained[acquired] = current;
+        acquired++;
+      }
+      return retained;
+    } catch (Throwable failure) {
+      closeAll(retained, acquired, failure);
+      throw failure;
+    }
+  }
+
+  /**
+   * Allocates one device buffer as large as the sum of {@code bufSizes} and returns one slice
+   * per entry, laid out back to back in the given order. The backing allocation is closed
+   * before returning. If anything is thrown, the slices created so far are closed before the
+   * error is rethrown.
+   */
+  public static DeviceMemoryBuffer[] allocateBuffers(long[] bufSizes) {
+    final DeviceMemoryBuffer[] slices = new DeviceMemoryBuffer[bufSizes.length];
+    int created = 0;
+    try (DeviceMemoryBuffer backing = DeviceMemoryBuffer.allocate(sum(bufSizes))) {
+      long offset = 0L;
+      while (created < bufSizes.length) {
+        final long size = bufSizes[created];
+        slices[created] = backing.slice(offset, size);
+        created++;
+        offset += size;
+      }
+      return slices;
+    } catch (Throwable failure) {
+      closeAll(slices, created, failure);
+      throw failure;
+    }
+  }
+
+  /** Adds up {@code values} with plain {@code long} arithmetic. */
+  private static long sum(long[] values) {
+    long total = 0L;
+    for (int i = 0; i < values.length; i++) {
+      total += values[i];
+    }
+    return total;
+  }
+
+  /**
+   * Closes the first {@code count} non-null entries of {@code values}. Anything thrown by a
+   * close call is attached to {@code cause} as a suppressed exception instead of propagating.
+   */
+  private static void closeAll(AutoCloseable[] values, int count, Throwable cause) {
+    for (int i = 0; i < count; i++) {
+      final AutoCloseable entry = values[i];
+      if (entry == null) {
+        continue;
+      }
+      try {
+        entry.close();
+      } catch (Throwable closeFailure) {
+        cause.addSuppressed(closeFailure);
+      }
+    }
+  }
+}
diff --git a/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/ExecutorCache.java b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/ExecutorCache.java
new file mode 100644
index 00000000000..d2dba3fef99
--- /dev/null
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/ExecutorCache.java
@@ -0,0 +1,55 @@
+/*
+ * Copyright (c) 2025-2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.nvidia.spark.rapids;
+
+import java.lang.management.ManagementFactory;
+
+import ai.rapids.cudf.Cuda;
+import ai.rapids.cudf.CudaComputeMode;
+
+/**
+ * Executor-related values that are computed once, on first request, and then reused. Each value
+ * lives in its own nested holder class so that it is initialized only when its accessor is
+ * first called, matching the lazy semantics of the Scala object this class replaces.
+ */
+final class ExecutorCache {
+  private ExecutorCache() {}
+
+  private static final class ComputeModeLazy {
+    private static final CudaComputeMode VALUE = Cuda.getComputeMode();
+  }
+
+  private static final class GpuUuidLazy {
+    private static final byte[] VALUE = Cuda.getGpuUuid();
+  }
+
+  private static final class ProcessNameLazy {
+    private static final String VALUE = ManagementFactory.getRuntimeMXBean().getName();
+  }
+
+  static CudaComputeMode getCurrentDeviceComputeMode() {
+    return ComputeModeLazy.VALUE;
+  }
+
+  static byte[] getCurrentDeviceUuid() {
+    return GpuUuidLazy.VALUE;
+  }
+
+  static String getProcessName() {
+    return ProcessNameLazy.VALUE;
+  }
+}
diff --git a/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/FloatUtils.java b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/FloatUtils.java
new file mode 100644
index 00000000000..4dfce5f74d1
--- /dev/null
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/FloatUtils.java
@@ -0,0 +1,88 @@
+/*
+ * Copyright (c) 2020-2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.nvidia.spark.rapids;
+
+import ai.rapids.cudf.ColumnVector;
+import ai.rapids.cudf.ColumnView;
+import ai.rapids.cudf.DType;
+import ai.rapids.cudf.Scalar;
+
+/** Helpers for NaN and infinity handling on cudf FLOAT32 and FLOAT64 data. */
+public final class FloatUtils {
+  private FloatUtils() {}
+
+  /** Replaces NaNs in {@code cv} with zero; throws unless cv is FLOAT32 or FLOAT64. */
+  public static ColumnVector nanToZero(ColumnView cv) {
+    DType type = cv.getType();
+    boolean isDouble = type == DType.FLOAT64;
+    if (!isDouble && type != DType.FLOAT32) {
+      throw new IllegalArgumentException("Only Floats and Doubles allowed");
+    }
+    try (ColumnVector nanMask = cv.isNan();
+         Scalar zero = isDouble ? Scalar.fromDouble(0.0d) : Scalar.fromFloat(0.0f)) {
+      return nanMask.ifElse(zero, cv);
+    }
+  }
+
+  /** Creates a NaN scalar for FLOAT64 or FLOAT32; any other type is rejected. */
+  public static Scalar getNanScalar(DType dType) {
+    if (dType == DType.FLOAT64) {
+      return Scalar.fromDouble(Double.NaN);
+    }
+    if (dType == DType.FLOAT32) {
+      return Scalar.fromFloat(Float.NaN);
+    }
+    throw new IllegalArgumentException("NaNs are only supported for Float types");
+  }
+
+  /** Creates a +infinity scalar: a double for FLOAT64, a float for every other type. */
+  public static Scalar getPositiveInfinityScalar(DType dType) {
+    return dType == DType.FLOAT64
+        ? Scalar.fromDouble(Double.POSITIVE_INFINITY)
+        : Scalar.fromFloat(Float.POSITIVE_INFINITY);
+  }
+
+  /** Creates a -infinity scalar: a double for FLOAT64, a float for every other type. */
+  public static Scalar getNegativeInfinityScalar(DType dType) {
+    return dType == DType.FLOAT64
+        ? Scalar.fromDouble(Double.NEGATIVE_INFINITY)
+        : Scalar.fromFloat(Float.NEGATIVE_INFINITY);
+  }
+
+  /** Creates a two-row column of +infinity and -infinity; doubles only for FLOAT64. */
+  public static ColumnVector getInfinityVector(DType dtype) {
+    return dtype == DType.FLOAT64
+        ? ColumnVector.fromDoubles(Double.POSITIVE_INFINITY, Double.NEGATIVE_INFINITY)
+        : ColumnVector.fromFloats(Float.POSITIVE_INFINITY, Float.NEGATIVE_INFINITY);
+  }
+
+  /** Runs findAndReplaceAll on {@code vec}, mapping both infinities to null. */
+  public static ColumnVector infinityToNulls(ColumnVector vec) {
+    DType type = vec.getType();
+    try (ColumnVector infinities = getInfinityVector(type);
+         ColumnVector nulls = getNullVector(type)) {
+      return vec.findAndReplaceAll(infinities, nulls);
+    }
+  }
+
+  /** Creates a two-row all-null column: doubles for FLOAT64, floats otherwise. */
+  private static ColumnVector getNullVector(DType dtype) {
+    return dtype == DType.FLOAT64
+        ? ColumnVector.fromBoxedDoubles((Double) null, (Double) null)
+        : ColumnVector.fromBoxedFloats((Float) null, (Float) null);
+  }
+}
diff --git a/sql-plugin/src/main/java/com/nvidia/spark/rapids/GpuColumnVectorBase.java b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/GpuColumnVectorBase.java
similarity index 98%
rename from sql-plugin/src/main/java/com/nvidia/spark/rapids/GpuColumnVectorBase.java
rename to sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/GpuColumnVectorBase.java
index 5d707cd9e12..8a0dc00a338 100644
--- a/sql-plugin/src/main/java/com/nvidia/spark/rapids/GpuColumnVectorBase.java
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/GpuColumnVectorBase.java
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2020-2021, NVIDIA CORPORATION.
+ * Copyright (c) 2020-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
diff --git a/sql-plugin/src/main/java/com/nvidia/spark/rapids/GpuCompressedColumnVector.java b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/GpuCompressedColumnVector.java
similarity index 90%
rename from sql-plugin/src/main/java/com/nvidia/spark/rapids/GpuCompressedColumnVector.java
rename to sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/GpuCompressedColumnVector.java
index 1dc85cb2031..81abeb11eea 100644
--- a/sql-plugin/src/main/java/com/nvidia/spark/rapids/GpuCompressedColumnVector.java
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/GpuCompressedColumnVector.java
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2020-2024, NVIDIA CORPORATION.
+ * Copyright (c) 2020-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -35,14 +35,6 @@ public final class GpuCompressedColumnVector extends GpuColumnVectorBase
   private final DeviceMemoryBuffer buffer;
   private final TableMeta tableMeta;
 
-  /**
-   * Build a columnar batch from a compressed table.
-   * NOTE: The data remains compressed and cannot be accessed directly from the columnar batch.
-   */
-  public static ColumnarBatch from(CompressedTable compressedTable) {
-    return from(compressedTable.buffer(), compressedTable.meta());
-  }
-
   public static boolean isBatchCompressed(ColumnarBatch batch) {
     return batch.numCols() == 1 && batch.column(0) instanceof GpuCompressedColumnVector;
   }
diff --git a/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/GpuListUtils.java b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/GpuListUtils.java
new file mode 100644
index 00000000000..a448cdaf7ba
--- /dev/null
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/GpuListUtils.java
@@ -0,0 +1,59 @@
+/*
+ * Copyright (c) 2021-2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.nvidia.spark.rapids;
+
+import java.util.Optional;
+
+import ai.rapids.cudf.ColumnView;
+import ai.rapids.cudf.DType;
+import ai.rapids.cudf.BaseDeviceMemoryBuffer;
+
+/** Utility methods for working with cudf LIST (array) columns. */
+public final class GpuListUtils {
+  private GpuListUtils() {}
+
+  /**
+   * Builds a LIST view that reuses the offsets and validity of {@code listCol} but takes
+   * {@code newDataCol} as its child data. Only a view is returned, so the caller must keep
+   * both {@code listCol} and {@code newDataCol} alive for as long as the view is in use.
+   *
+   * @param listCol the list column whose offsets, validity, row count and null count are reused
+   * @param newDataCol the replacement child data column
+   * @return a new ColumnView
+   * @throws IllegalArgumentException if {@code newDataCol} does not have the same number of
+   *     rows as the current child data column
+   */
+  public static ColumnView replaceListDataColumnAsView(
+      ColumnView listCol, ColumnView newDataCol) {
+    assert DType.LIST.equals(listCol.getType());
+    // Only the row count of the current child is needed, so its view is released right away.
+    long currentDataRows;
+    try (ColumnView currentData = listCol.getChildColumnView(0)) {
+      currentDataRows = currentData.getRowCount();
+    }
+    if (currentDataRows != newDataCol.getRowCount()) {
+      throw new IllegalArgumentException("Mismatch in the number of rows in the data columns");
+    }
+    // The buffer handles are closed as soon as the view has been constructed.
+    try (BaseDeviceMemoryBuffer offsetBuf = listCol.getOffsets();
+         BaseDeviceMemoryBuffer validityBuf = listCol.getValid()) {
+      ColumnView[] children = { newDataCol };
+      return new ColumnView(DType.LIST, listCol.getRowCount(),
+          Optional.of(listCol.getNullCount()), validityBuf, offsetBuf, children);
+    }
+  }
+}
diff --git a/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/GpuOrcTimezoneUtils.java b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/GpuOrcTimezoneUtils.java
new file mode 100644
index 00000000000..34cc1ac221f
--- /dev/null
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/GpuOrcTimezoneUtils.java
@@ -0,0 +1,163 @@
+/*
+ * Copyright (c) 2025-2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.nvidia.spark.rapids;
+
+import java.time.LocalDateTime;
+import java.time.ZoneId;
+import java.util.ArrayList;
+import java.util.List;
+import java.util.Optional;
+
+import ai.rapids.cudf.ColumnVector;
+import ai.rapids.cudf.ColumnView;
+import ai.rapids.cudf.DType;
+import ai.rapids.cudf.Scalar;
+import ai.rapids.cudf.Table;
+
+public final class GpuOrcTimezoneUtils {
+  private static final ZoneId UTC = ZoneId.of("UTC");
+
+  private GpuOrcTimezoneUtils() {
+  }
+
+  /**
+   * Get the offset in microseconds for 2015-01-01 between JVM timezone and UTC timezone.
+   * Computed as (midnight in UTC) minus (midnight in {@code jvmTz}), both as epoch time.
+   * @param jvmTz the JVM timezone to calculate the offset for
+   * @return the offset in microseconds between the JVM timezone and UTC timezone
+   */
+  private static long getOffsetForJanuaryFirst2015(ZoneId jvmTz) {
+    long t1 = LocalDateTime.of(2015, 1, 1, 0, 0, 0).atZone(jvmTz).toInstant()
+        .getEpochSecond();
+    long t2 = LocalDateTime.of(2015, 1, 1, 0, 0, 0).atZone(UTC).toInstant()
+        .getEpochSecond();
+    return (t2 - t1) * 1000000L; // seconds -> microseconds
+  }
+
+  private static <T extends ColumnView> T addToClose(List<ColumnView> toClose, T view) {
+    toClose.add(view); // registered so the owner of toClose can close it later
+    return view;
+  }
+
+  /**
+   * Recursively rebase timestamp columns in {@code col} by subtracting {@code diffMicros},
+   * descending into list and struct children. Only child views are added to {@code toClose}.
+   */
+  private static ColumnView rebaseTimestampRecursively(
+      ColumnView col,
+      List<ColumnView> toClose,
+      long diffMicros) {
+    DType dType = col.getType();
+    if (dType.hasTimeResolution()) {
+      assert dType.equals(DType.TIMESTAMP_MICROSECONDS) :
+          "Only TIMESTAMP_MICROSECONDS is supported, but got " + dType;
+
+      try (ColumnView longs = col.bitCastTo(DType.INT64);
+           Scalar offsetScalar = Scalar.fromLong(diffMicros);
+           ColumnVector rebased = longs.sub(offsetScalar)) {
+        return rebased.castTo(DType.TIMESTAMP_MICROSECONDS);
+      }
+    } else if (DType.LIST.equals(dType)) {
+      ColumnView child = addToClose(toClose, col.getChildColumnView(0));
+      ColumnView newChild = rebaseTimestampRecursively(child, toClose, diffMicros);
+      if (newChild != child) { // a different object means the child was replaced
+        return col.replaceListChild(addToClose(toClose, newChild));
+      }
+      return col;
+    } else if (DType.STRUCT.equals(dType)) {
+      ColumnView[] newViews = new ColumnView[col.getNumChildren()]; // one view per child
+      for (int i = 0; i < newViews.length; i++) {
+        ColumnView child = addToClose(toClose, col.getChildColumnView(i));
+        ColumnView newChild = rebaseTimestampRecursively(child, toClose, diffMicros);
+        if (newChild != child) {
+          addToClose(toClose, newChild);
+        }
+        newViews[i] = newChild;
+      }
+      return new ColumnView(col.getType(), col.getRowCount(), Optional.of(col.getNullCount()),
+          col.getValid(), col.getOffsets(), newViews); // rebuilt even if no child changed
+    }
+    return col; // not a timestamp, list or struct: nothing to rebase
+  }
+
+  /**
+   * Rebase timestamp columns in the input table to the system default timezone. If the system's
+   * default timezone is UTC, this returns the input table as-is. Otherwise the input table is
+   * closed before returning.
+   *
+   * @param input the input table; closed by this method unless it is returned as-is
+   * @return a table with timestamp columns rebased
+   */
+  public static Table rebaseTimeZone(Table input) {
+    ZoneId toZoneId = ZoneId.systemDefault();
+
+    if (UTC.equals(toZoneId)) {
+      return input;
+    }
+
+    long diffMicros = getOffsetForJanuaryFirst2015(toZoneId);
+    try (Table ignored = input) { // closes input on every exit from this block
+      ColumnVector[] newColumns = new ColumnVector[input.getNumberOfColumns()];
+      try {
+        for (int colIdx = 0; colIdx < newColumns.length; colIdx++) {
+          ColumnVector col = input.getColumn(colIdx);
+          List<ColumnView> toClose = new ArrayList<>(); // temporaries for this column only
+          try {
+            ColumnView rebased = rebaseTimestampRecursively(col, toClose, diffMicros);
+            if (col == rebased) {
+              newColumns[colIdx] = col.incRefCount();
+            } else {
+              toClose.add(rebased);
+              newColumns[colIdx] = rebased.copyToColumnVector();
+            }
+          } finally {
+            closeAll(toClose);
+          }
+        }
+        return new Table(newColumns);
+      } finally {
+        closeAll(newColumns); // NOTE(review): presumably Table holds its own references - confirm
+      }
+    }
+  }
+
+  private static void closeAll(ColumnView[] views) {
+    for (ColumnView view : views) {
+      if (view != null) {
+        view.close();
+      }
+    }
+  }
+
+  private static void closeAll(List<ColumnView> views) {
+    RuntimeException firstException = null;
+    for (ColumnView view : views) {
+      try {
+        view.close();
+      } catch (RuntimeException e) {
+        if (firstException == null) {
+          firstException = e;
+        } else {
+          firstException.addSuppressed(e);
+        }
+      }
+    }
+    if (firstException != null) {
+      throw firstException; // first failure, with later ones attached as suppressed
+    }
+  }
+}
diff --git a/sql-plugin/src/main/java/com/nvidia/spark/rapids/GpuPackedTableColumn.java b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/GpuPackedTableColumn.java
similarity index 98%
rename from sql-plugin/src/main/java/com/nvidia/spark/rapids/GpuPackedTableColumn.java
rename to sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/GpuPackedTableColumn.java
index 7c0b1a5a517..90ca8a5a908 100644
--- a/sql-plugin/src/main/java/com/nvidia/spark/rapids/GpuPackedTableColumn.java
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/GpuPackedTableColumn.java
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2021, NVIDIA CORPORATION.
+ * Copyright (c) 2021-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
diff --git a/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/HostAllocResult.java b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/HostAllocResult.java
new file mode 100644
index 00000000000..8cb8cf9f0a0
--- /dev/null
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/HostAllocResult.java
@@ -0,0 +1,61 @@
+/*
+ * Copyright (c) 2023-2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.nvidia.spark.rapids;
+
+import java.util.Objects;
+
+import ai.rapids.cudf.HostMemoryBuffer;
+
+/** Immutable value pairing a HostMemoryBuffer with its {@code isPinned} flag. */
+public class HostAllocResult {
+  public final HostMemoryBuffer buffer;
+  public final boolean isPinned;
+
+  public HostAllocResult(HostMemoryBuffer buffer, boolean isPinned) {
+    this.isPinned = isPinned;
+    this.buffer = buffer;
+  }
+
+  /** Accessor form of the {@code buffer} field. */
+  public HostMemoryBuffer buffer() {
+    return this.buffer;
+  }
+
+  /** Accessor form of the {@code isPinned} field. */
+  public boolean isPinned() {
+    return this.isPinned;
+  }
+
+  @Override
+  public boolean equals(Object other) {
+    // Equal when it is the same instance, or the same type with both fields equal.
+    return other == this || (other instanceof HostAllocResult
+        && isPinned == ((HostAllocResult) other).isPinned
+        && Objects.equals(buffer, ((HostAllocResult) other).buffer));
+  }
+
+  @Override
+  public int hashCode() {
+    return Objects.hash(buffer, isPinned);
+  }
+
+  /** Renders as {@code HostAllocResult(buffer,isPinned)}. */
+  @Override
+  public String toString() {
+    return "HostAllocResult(" + buffer + "," + isPinned + ")";
+  }
+}
diff --git a/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/HostByteBufferIterator.java b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/HostByteBufferIterator.java
new file mode 100644
index 00000000000..ebd5a0d9997
--- /dev/null
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/HostByteBufferIterator.java
@@ -0,0 +1,54 @@
+/*
+ * Copyright (c) 2023-2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.nvidia.spark.rapids;
+
+import java.nio.ByteBuffer;
+
+import ai.rapids.cudf.HostMemoryBuffer;
+
+/**
+ * Iterator over a host buffer that hands it out as consecutive ByteBuffer chunks, each at most
+ * {@code Integer.MAX_VALUE} bytes, so that buffers beyond the 2GB ByteBuffer limit can still be
+ * covered end to end.
+ *
+ * NOTE: The host buffer's reference count is NOT incremented here. The caller must make sure
+ * the buffer stays valid for as long as this iterator is in use.
+ */
+public class HostByteBufferIterator extends AbstractHostByteBufferIterator {
+  private final HostMemoryBuffer hostBuffer;
+  private final long totalLength;
+
+  public HostByteBufferIterator(HostMemoryBuffer hostBuffer) {
+    this.hostBuffer = hostBuffer;
+    this.totalLength = (hostBuffer != null) ? hostBuffer.getLength() : 0;
+  }
+
+  @Override
+  public long totalLength() {
+    return this.totalLength;
+  }
+
+  @Override
+  public long limit() {
+    return Integer.MAX_VALUE;
+  }
+
+  @Override
+  public ByteBuffer getByteBuffer(long offset, long length) {
+    return this.hostBuffer.asByteBuffer(offset, (int) length);
+  }
+}
diff --git a/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/HostMemoryInputStream.java b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/HostMemoryInputStream.java
new file mode 100644
index 00000000000..81c91ce3740
--- /dev/null
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/HostMemoryInputStream.java
@@ -0,0 +1,111 @@
+/*
+ * Copyright (c) 2019-2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.nvidia.spark.rapids;
+
+import java.io.IOException;
+import java.io.InputStream;
+import java.nio.ByteBuffer;
+
+import ai.rapids.cudf.HostMemoryBuffer;
+
+/**
+ * An InputStream over the first {@code hmbLength} bytes of a HostMemoryBuffer.
+ * NOTE: Closing this input stream does NOT close the buffer!
+ */
+public class HostMemoryInputStream extends InputStream {
+  public final HostMemoryBuffer hmb;
+  public final long hmbLength;
+  protected long pos = 0;
+  protected long mark = -1; // -1 until mark() has been called
+
+  public HostMemoryInputStream(HostMemoryBuffer hmb, long hmbLength) {
+    this.hmb = hmb;
+    this.hmbLength = hmbLength;
+  }
+
+  public HostMemoryBuffer hmb() {
+    return hmb;
+  }
+
+  public long hmbLength() {
+    return hmbLength;
+  }
+
+  @Override
+  public int read() {
+    if (pos >= hmbLength) {
+      return -1;
+    }
+    byte result = hmb.getByte(pos);
+    pos += 1;
+    // Java bytes are signed, so mask off the upper bits to avoid returning negative EOF values.
+    return result & 0xFF;
+  }
+
+  @Override
+  public int read(byte[] buffer, int offset, int length) {
+    if (pos >= hmbLength) {
+      return -1;
+    }
+    int numBytes = Math.min(available(), length); // never read past hmbLength
+    hmb.getBytes(buffer, offset, pos, numBytes);
+    pos += numBytes;
+    return numBytes;
+  }
+
+  public ByteBuffer readByteBuffer(int length) {
+    ByteBuffer byteBuffer = hmb.asByteBuffer(pos, length);
+    pos += length;
+    return byteBuffer;
+  }
+
+  @Override
+  public long skip(long count) {
+    // Clamp to [0, remaining]: pos + count would overflow for counts like Long.MAX_VALUE.
+    long skipped = Math.max(0L, Math.min(count, hmbLength - pos));
+    pos += skipped;
+    return skipped;
+  }
+
+  @Override
+  public int available() {
+    return (int) Math.min(hmbLength - pos, Integer.MAX_VALUE);
+  }
+
+  @Override
+  public void mark(int ignored) {
+    mark = pos;
+  }
+
+  @Override
+  public void reset() throws IOException {
+    // A mark taken at position 0 is valid; only the initial -1 means "never marked".
+    if (mark < 0) {
+      throw new IOException("reset called before mark");
+    }
+    pos = mark;
+  }
+
+  @Override
+  public boolean markSupported() {
+    return true;
+  }
+
+  public long getPos() {
+    return pos;
+  }
+}
diff --git a/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/HostMemoryOutputStream.java b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/HostMemoryOutputStream.java
new file mode 100644
index 00000000000..25a95874e96
--- /dev/null
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/HostMemoryOutputStream.java
@@ -0,0 +1,100 @@
+/*
+ * Copyright (c) 2019-2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.nvidia.spark.rapids;
+
+import java.io.EOFException;
+import java.io.IOException;
+import java.io.OutputStream;
+import java.nio.ByteBuffer;
+import java.nio.channels.ReadableByteChannel;
+
+import ai.rapids.cudf.HostMemoryBuffer;
+
+/**
+ * An OutputStream that writes sequentially into a HostMemoryBuffer. The write position starts
+ * at 0, advances with every write, and can be read or moved with getPos() and seek().
+ *
+ * NOTE: Closing this output stream does NOT close the buffer!
+ */
+public class HostMemoryOutputStream extends OutputStream {
+  public final HostMemoryBuffer buffer;
+  protected long pos = 0;
+
+  public HostMemoryOutputStream(HostMemoryBuffer buffer) {
+    this.buffer = buffer;
+  }
+
+  public HostMemoryBuffer buffer() {
+    return this.buffer;
+  }
+
+  @Override
+  public void write(int i) {
+    this.buffer.setByte(pos, (byte) i);
+    pos++;
+  }
+
+  @Override
+  public void write(byte[] bytes) {
+    this.buffer.setBytes(pos, bytes, 0, bytes.length);
+    pos = pos + bytes.length;
+  }
+
+  @Override
+  public void write(byte[] bytes, int offset, int len) {
+    this.buffer.setBytes(pos, bytes, offset, len);
+    pos = pos + len;
+  }
+
+  public void write(ByteBuffer data) {
+    int numBytes = data.remaining();
+    this.buffer.asByteBuffer(pos, numBytes).put(data);
+    pos += numBytes;
+  }
+
+  public ByteBuffer writeAsByteBuffer(int length) {
+    ByteBuffer window = this.buffer.asByteBuffer(pos, length);
+    pos += length;
+    return window;
+  }
+
+  public long getPos() {
+    return this.pos;
+  }
+
+  public void seek(long newPos) {
+    this.pos = newPos;
+  }
+
+  /** Copies exactly {@code length} bytes from {@code channel} to the current position. */
+  public void copyFromChannel(ReadableByteChannel channel, long length) throws IOException {
+    final long endPos = pos + length;
+    if (endPos > buffer.getLength()) {
+      throw new AssertionError();
+    }
+    while (pos != endPos) {
+      int sliceLen = (int) Math.min(endPos - pos, Integer.MAX_VALUE);
+      ByteBuffer slice = buffer.asByteBuffer(pos, sliceLen);
+      while (slice.hasRemaining()) {
+        if (channel.read(slice) < 0) {
+          throw new EOFException("Unexpected EOF while reading from byte channel");
+        }
+      }
+      pos += sliceLen;
+    }
+  }
+}
diff --git a/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/MemoryBoundedPoolConf.java b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/MemoryBoundedPoolConf.java
new file mode 100644
index 00000000000..781d7949132
--- /dev/null
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/MemoryBoundedPoolConf.java
@@ -0,0 +1,80 @@
+/*
+ * Copyright (c) 2024-2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.nvidia.spark.rapids;
+
+import java.util.Objects;
+
+/** Immutable {@code ThreadPoolConf} that adds memoryCapacity and waitMemTimeoutMs settings. */
+public class MemoryBoundedPoolConf implements ThreadPoolConf {
+  private static final long serialVersionUID = 1L;
+
+  private final int maxThreadNumber;
+  private final boolean stageLevelPool;
+  private final long memoryCapacity;
+  private final long waitMemTimeoutMs;
+
+  public MemoryBoundedPoolConf(int maxThreadNumber, boolean stageLevelPool,
+      long memoryCapacity, long waitMemTimeoutMs) {
+    this.waitMemTimeoutMs = waitMemTimeoutMs;
+    this.memoryCapacity = memoryCapacity;
+    this.stageLevelPool = stageLevelPool;
+    this.maxThreadNumber = maxThreadNumber;
+  }
+
+  @Override
+  public int maxThreadNumber() {
+    return this.maxThreadNumber;
+  }
+
+  @Override
+  public boolean stageLevelPool() {
+    return this.stageLevelPool;
+  }
+
+  public long memoryCapacity() {
+    return this.memoryCapacity;
+  }
+
+  public long waitMemTimeoutMs() {
+    return this.waitMemTimeoutMs;
+  }
+
+  /** Two instances are equal when all four settings match. */
+  @Override
+  public boolean equals(Object other) {
+    if (this == other || !(other instanceof MemoryBoundedPoolConf)) {
+      return this == other;
+    }
+    MemoryBoundedPoolConf rhs = (MemoryBoundedPoolConf) other;
+    return maxThreadNumber == rhs.maxThreadNumber
+        && stageLevelPool == rhs.stageLevelPool
+        && memoryCapacity == rhs.memoryCapacity
+        && waitMemTimeoutMs == rhs.waitMemTimeoutMs;
+  }
+
+  @Override
+  public int hashCode() {
+    return Objects.hash(maxThreadNumber, stageLevelPool, memoryCapacity, waitMemTimeoutMs);
+  }
+
+  /** Renders the four settings, comma separated, in declaration order. */
+  @Override
+  public String toString() {
+    return "MemoryBoundedPoolConf(" + maxThreadNumber + "," + stageLevelPool + ","
+        + memoryCapacity + "," + waitMemTimeoutMs + ")";
+  }
+}
diff --git a/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/MemoryBufferToHostByteBufferIterator.java b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/MemoryBufferToHostByteBufferIterator.java
new file mode 100644
index 00000000000..3c6693767c2
--- /dev/null
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/MemoryBufferToHostByteBufferIterator.java
@@ -0,0 +1,66 @@
+/*
+ * Copyright (c) 2023-2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.nvidia.spark.rapids;
+
+import java.nio.ByteBuffer;
+
+import ai.rapids.cudf.Cuda;
+import ai.rapids.cudf.HostMemoryBuffer;
+import ai.rapids.cudf.MemoryBuffer;
+
+/**
+ * Iterator that exposes a MemoryBuffer as a sequence of ByteBuffers by copying it, one chunk
+ * at a time, into a host-backed bounce buffer, working around the 2GB ByteBuffer size limit.
+ *
+ * NOTE: memoryBuffer's reference count is NOT incremented here. The caller must ensure that
+ * this iterator does not outlive memoryBuffer.
+ */
+public class MemoryBufferToHostByteBufferIterator extends AbstractHostByteBufferIterator {
+  private final MemoryBuffer memoryBuffer;
+  private final HostMemoryBuffer bounceBuffer;
+  private final Cuda.Stream stream;
+  private final long totalLength;
+  private final long limit;
+
+  public MemoryBufferToHostByteBufferIterator(
+      MemoryBuffer memoryBuffer, HostMemoryBuffer bounceBuffer, Cuda.Stream stream) {
+    this.memoryBuffer = memoryBuffer;
+    this.bounceBuffer = bounceBuffer;
+    this.stream = stream;
+    this.totalLength = (memoryBuffer != null) ? memoryBuffer.getLength() : 0;
+    // limit() is capped by both the bounce buffer length and Integer.MAX_VALUE.
+    this.limit = Math.min(bounceBuffer.getLength(), Integer.MAX_VALUE);
+  }
+
+  @Override
+  public long totalLength() {
+    return this.totalLength;
+  }
+
+  @Override
+  public long limit() {
+    return this.limit;
+  }
+
+  @Override
+  public ByteBuffer getByteBuffer(long offset, long length) {
+    // Copy the requested range to the front of the bounce buffer and wait for it to finish.
+    bounceBuffer.copyFromMemoryBufferAsync(0, memoryBuffer, offset, length, stream);
+    stream.sync();
+    return bounceBuffer.asByteBuffer(0, (int) length);
+  }
+}
diff --git a/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/MetricsBatchIterator.java b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/MetricsBatchIterator.java
new file mode 100644
index 00000000000..7795165e5fa
--- /dev/null
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/MetricsBatchIterator.java
@@ -0,0 +1,45 @@
+/*
+ * Copyright (c) 2022-2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.nvidia.spark.rapids;
+
+import scala.collection.Iterator;
+
+import org.apache.spark.TaskContext;
+import org.apache.spark.executor.InputMetrics;
+import org.apache.spark.sql.vectorized.ColumnarBatch;
+
+public class MetricsBatchIterator implements Iterator<ColumnarBatch> {
+  private final InputMetrics inputMetrics;
+  private final Iterator<ColumnarBatch> iter;
+
+  public MetricsBatchIterator(Iterator<ColumnarBatch> iter) {
+    this.inputMetrics = TaskContext.get().taskMetrics().inputMetrics(); // looked up once here
+    this.iter = iter;
+  }
+
+  @Override
+  public boolean hasNext() {
+    return this.iter.hasNext();
+  }
+
+  @Override
+  public ColumnarBatch next() {
+    final ColumnarBatch produced = iter.next();
+    inputMetrics.incRecordsRead(produced.numRows()); // every row handed out counts as read
+    return produced;
+  }
+}
diff --git a/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/MutableBlockInfo.java b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/MutableBlockInfo.java
new file mode 100644
index 00000000000..c2ed469f14a
--- /dev/null
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/MutableBlockInfo.java
@@ -0,0 +1,81 @@
+/*
+ * Copyright (c) 2022-2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.nvidia.spark.rapids;
+
+import java.io.Serializable;
+import java.util.Objects;
+
+/** Mutable Avro block metadata for iterator reuse. */
+public final class MutableBlockInfo implements Serializable {
+  private static final long serialVersionUID = 1L;
+
+  private long blockSize;
+  private long dataSize;
+  private long count;
+
+  /** Builds an instance holding the three given values. */
+  public MutableBlockInfo(long blockSize, long dataSize, long count) {
+    this.count = count;
+    this.dataSize = dataSize;
+    this.blockSize = blockSize;
+  }
+
+  public long blockSize() {
+    return this.blockSize;
+  }
+
+  public void setBlockSize(long blockSize) {
+    this.blockSize = blockSize;
+  }
+
+  public long dataSize() {
+    return this.dataSize;
+  }
+
+  public void setDataSize(long dataSize) {
+    this.dataSize = dataSize;
+  }
+
+  public long count() {
+    return this.count;
+  }
+
+  public void setCount(long count) {
+    this.count = count;
+  }
+
+  /** Two instances are equal when all three fields match. */
+  @Override
+  public boolean equals(Object obj) {
+    if (!(obj instanceof MutableBlockInfo)) {
+      return false;
+    }
+    MutableBlockInfo that = (MutableBlockInfo) obj;
+    return count == that.count && dataSize == that.dataSize && blockSize == that.blockSize;
+  }
+
+  /** Computed from the current field values, so it can change after a setter call. */
+  @Override
+  public int hashCode() {
+    return Objects.hash(blockSize, dataSize, count);
+  }
+
+  @Override
+  public String toString() {
+    return "MutableBlockInfo(" + blockSize + "," + dataSize + "," + count + ")";
+  }
+}
diff --git a/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/NullHostMemoryOutputStream.java b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/NullHostMemoryOutputStream.java
new file mode 100644
index 00000000000..09144654539
--- /dev/null
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/NullHostMemoryOutputStream.java
@@ -0,0 +1,50 @@
+/*
+ * Copyright (c) 2019-2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.nvidia.spark.rapids;
+
+import java.nio.channels.ReadableByteChannel;
+
+/** A HostMemoryOutputStream only counts the written bytes, nothing is actually written. */
+public final class NullHostMemoryOutputStream extends HostMemoryOutputStream {
+  public NullHostMemoryOutputStream() {
+    super(null);
+  }
+
+  @Override
+  public void write(int i) {
+    pos++; // one byte counted, none stored
+  }
+
+  @Override
+  public void write(byte[] bytes) {
+    pos += bytes.length;
+  }
+
+  @Override
+  public void write(byte[] bytes, int offset, int len) {
+    pos += len; // offset is irrelevant because bytes is never read
+  }
+
+  @Override
+  public void copyFromChannel(ReadableByteChannel channel, long length) {
+    // The channel is never read: pos moves to pos + length in steps of at most Integer.MAX_VALUE.
+    final long target = pos + length;
+    while (pos != target) {
+      pos += Math.min(target - pos, Integer.MAX_VALUE);
+    }
+  }
+}
diff --git a/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/PartitionRowData.java b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/PartitionRowData.java
new file mode 100644
index 00000000000..c5ae84db178
--- /dev/null
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/PartitionRowData.java
@@ -0,0 +1,85 @@
+/*
+ * Copyright (c) 2023-2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.nvidia.spark.rapids;
+
+import java.util.Objects;
+
+import org.apache.spark.sql.catalyst.InternalRow;
+
+/** Partition value and replication count. */
+public final class PartitionRowData {
+  private final InternalRow rowValue;
+  private final int rowNum;
+
+  public PartitionRowData(InternalRow rowValue, int rowNum) {
+    this.rowNum = rowNum;
+    this.rowValue = rowValue;
+  }
+
+  public InternalRow rowValue() {
+    return this.rowValue;
+  }
+
+  public int rowNum() {
+    return this.rowNum;
+  }
+
+  /** Pairs rowValues[i] with rowNums[i], up to the length of the shorter array. */
+  public static PartitionRowData[] from(InternalRow[] rowValues, int[] rowNums) {
+    PartitionRowData[] out = new PartitionRowData[Math.min(rowValues.length, rowNums.length)];
+    for (int idx = 0; idx < out.length; idx++) {
+      out[idx] = new PartitionRowData(rowValues[idx], rowNums[idx]);
+    }
+    return out;
+  }
+
+  /**
+   * Same pairing as the int[] overload, narrowing each long row number to an int.
+   * @throws IllegalArgumentException if a paired row number is greater than Integer.MAX_VALUE
+   */
+  public static PartitionRowData[] from(InternalRow[] rowValues, long[] rowNums) {
+    PartitionRowData[] out = new PartitionRowData[Math.min(rowValues.length, rowNums.length)];
+    for (int idx = 0; idx < out.length; idx++) {
+      final long wide = rowNums[idx];
+      if (wide > Integer.MAX_VALUE) {
+        throw new IllegalArgumentException(
+            "Row number " + wide + " exceeds max value of an integer.");
+      }
+      out[idx] = new PartitionRowData(rowValues[idx], (int) wide);
+    }
+    return out;
+  }
+
+  @Override
+  public boolean equals(Object obj) {
+    if (!(obj instanceof PartitionRowData)) {
+      return false;
+    }
+    PartitionRowData that = (PartitionRowData) obj;
+    return rowNum == that.rowNum && Objects.equals(rowValue, that.rowValue);
+  }
+
+  @Override
+  public int hashCode() {
+    return Objects.hash(rowValue, rowNum);
+  }
+
+  @Override
+  public String toString() {
+    return "PartitionRowData(" + rowValue + "," + rowNum + ")";
+  }
+}
diff --git a/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/ProfileEndMsg.java b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/ProfileEndMsg.java
new file mode 100644
index 00000000000..c19651fa101
--- /dev/null
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/ProfileEndMsg.java
@@ -0,0 +1,62 @@
+/*
+ * Copyright (c) 2024-2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.nvidia.spark.rapids;
+
+import java.util.Objects;
+
+/** ProfileMsg value holding an executor id and a path. */
+public class ProfileEndMsg implements ProfileMsg {
+  private static final long serialVersionUID = 1L;
+
+  private final String executorId;
+  private final String path;
+
+  public ProfileEndMsg(String executorId, String path) {
+    this.path = path;
+    this.executorId = executorId;
+  }
+
+  public String executorId() {
+    return this.executorId;
+  }
+
+  public String path() {
+    return this.path;
+  }
+
+  @Override
+  public boolean equals(Object other) {
+    if (!(other instanceof ProfileEndMsg)) {
+      return false;
+    }
+    // Objects.equals keeps both comparisons null-safe.
+    ProfileEndMsg rhs = (ProfileEndMsg) other;
+    return Objects.equals(path, rhs.path) && Objects.equals(executorId, rhs.executorId);
+  }
+
+  /** Hashes the same two fields that equals compares. */
+  @Override
+  public int hashCode() {
+    return Objects.hash(executorId, path);
+  }
+
+  /** Renders as ProfileEndMsg(executorId,path). */
+  @Override
+  public String toString() {
+    return "ProfileEndMsg(" + executorId + "," + path + ")";
+  }
+}
diff --git a/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/ProfileErrorMsg.java b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/ProfileErrorMsg.java
new file mode 100644
index 00000000000..7aeeffc5c9d
--- /dev/null
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/ProfileErrorMsg.java
@@ -0,0 +1,62 @@
+/*
+ * Copyright (c) 2024-2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.nvidia.spark.rapids;
+
+import java.util.Objects;
+
+/** ProfileMsg value holding an executor id and a message string. */
+public class ProfileErrorMsg implements ProfileMsg {
+  private static final long serialVersionUID = 1L;
+
+  private final String executorId;
+  private final String msg;
+
+  public ProfileErrorMsg(String executorId, String msg) {
+    this.msg = msg;
+    this.executorId = executorId;
+  }
+
+  public String executorId() {
+    return this.executorId;
+  }
+
+  public String msg() {
+    return this.msg;
+  }
+
+  @Override
+  public boolean equals(Object other) {
+    if (!(other instanceof ProfileErrorMsg)) {
+      return false;
+    }
+    // Objects.equals keeps both comparisons null-safe.
+    ProfileErrorMsg rhs = (ProfileErrorMsg) other;
+    return Objects.equals(msg, rhs.msg) && Objects.equals(executorId, rhs.executorId);
+  }
+
+  /** Hashes the same two fields that equals compares. */
+  @Override
+  public int hashCode() {
+    return Objects.hash(executorId, msg);
+  }
+
+  /** Renders as ProfileErrorMsg(executorId,msg). */
+  @Override
+  public String toString() {
+    return "ProfileErrorMsg(" + executorId + "," + msg + ")";
+  }
+}
diff --git a/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/ProfileInitMsg.java b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/ProfileInitMsg.java
new file mode 100644
index 00000000000..55a3b7627a7
--- /dev/null
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/ProfileInitMsg.java
@@ -0,0 +1,62 @@
+/*
+ * Copyright (c) 2024-2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.nvidia.spark.rapids;
+
+import java.util.Objects;
+
+/** ProfileMsg value holding an executor id and a path. */
+public class ProfileInitMsg implements ProfileMsg {
+  private static final long serialVersionUID = 1L;
+
+  private final String executorId;
+  private final String path;
+
+  public ProfileInitMsg(String executorId, String path) {
+    this.path = path;
+    this.executorId = executorId;
+  }
+
+  public String executorId() {
+    return this.executorId;
+  }
+
+  public String path() {
+    return this.path;
+  }
+
+  @Override
+  public boolean equals(Object other) {
+    if (!(other instanceof ProfileInitMsg)) {
+      return false;
+    }
+    // Objects.equals keeps both comparisons null-safe.
+    ProfileInitMsg rhs = (ProfileInitMsg) other;
+    return Objects.equals(path, rhs.path) && Objects.equals(executorId, rhs.executorId);
+  }
+
+  /** Hashes the same two fields that equals compares. */
+  @Override
+  public int hashCode() {
+    return Objects.hash(executorId, path);
+  }
+
+  /** Renders as ProfileInitMsg(executorId,path). */
+  @Override
+  public String toString() {
+    return "ProfileInitMsg(" + executorId + "," + path + ")";
+  }
+}
diff --git a/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/ProfileJobStageQueryMsg.java b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/ProfileJobStageQueryMsg.java
new file mode 100644
index 00000000000..dc2a8666a31
--- /dev/null
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/ProfileJobStageQueryMsg.java
@@ -0,0 +1,62 @@
+/*
+ * Copyright (c) 2024-2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.nvidia.spark.rapids;
+
+import java.util.Objects;
+
+/** ProfileMsg value holding the active job and stage id arrays, compared by array contents. */
+public class ProfileJobStageQueryMsg implements ProfileMsg {
+  private static final long serialVersionUID = 1L;
+
+  private final int[] activeJobs;
+  private final int[] activeStages;
+
+  public ProfileJobStageQueryMsg(int[] activeJobs, int[] activeStages) {
+    this.activeJobs = activeJobs;
+    this.activeStages = activeStages;
+  }
+
+  public int[] activeJobs() {
+    return activeJobs;
+  }
+
+  public int[] activeStages() {
+    return activeStages;
+  }
+
+  /** Compares array contents; Objects.equals on int[] would only compare references. */
+  @Override
+  public boolean equals(Object other) {
+    if (!(other instanceof ProfileJobStageQueryMsg)) {
+      return false;
+    }
+    ProfileJobStageQueryMsg that = (ProfileJobStageQueryMsg) other;
+    return Objects.deepEquals(activeJobs, that.activeJobs) &&
+        Objects.deepEquals(activeStages, that.activeStages);
+  }
+
+  @Override
+  public int hashCode() {
+    return java.util.Arrays.deepHashCode(new Object[] {activeJobs, activeStages}); // by content
+  }
+
+  @Override
+  public String toString() {
+    return "ProfileJobStageQueryMsg(" + java.util.Arrays.toString(activeJobs) + "," +
+        java.util.Arrays.toString(activeStages) + ")";
+  }
+}
diff --git a/sql-plugin/src/main/spark330/scala/org/apache/spark/sql/errors/ConvUtils.scala b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/ProfileMsg.java
similarity index 57%
rename from sql-plugin/src/main/spark330/scala/org/apache/spark/sql/errors/ConvUtils.scala
rename to sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/ProfileMsg.java
index 745d878f141..1cbeababfbb 100644
--- a/sql-plugin/src/main/spark330/scala/org/apache/spark/sql/errors/ConvUtils.scala
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/ProfileMsg.java
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2025-2026, NVIDIA CORPORATION.
+ * Copyright (c) 2024-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -14,19 +14,9 @@
  * limitations under the License.
  */
 
+package com.nvidia.spark.rapids;
 
-/*** spark-rapids-shim-json-lines
-{"spark": "330"}
-{"spark": "330db"}
-{"spark": "331"}
-{"spark": "332"}
-{"spark": "332db"}
-{"spark": "333"}
-{"spark": "334"}
-spark-rapids-shim-json-lines ***/
-package org.apache.spark.sql.errors
+import java.io.Serializable;
 
-object ConvUtils {
-  // only Spark versions >= 340 support this function
-  def overflowInConvError(): Unit = throw new UnsupportedOperationException()
+public interface ProfileMsg extends Serializable { // common type of the Profile*Msg classes
 }
diff --git a/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/ProfileStatusMsg.java b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/ProfileStatusMsg.java
new file mode 100644
index 00000000000..b5db1431c36
--- /dev/null
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/ProfileStatusMsg.java
@@ -0,0 +1,62 @@
+/*
+ * Copyright (c) 2024-2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.nvidia.spark.rapids;
+
+import java.util.Objects;
+
+/** ProfileMsg value holding an executor id and a message string. */
+public class ProfileStatusMsg implements ProfileMsg {
+  private static final long serialVersionUID = 1L;
+
+  private final String executorId;
+  private final String msg;
+
+  public ProfileStatusMsg(String executorId, String msg) {
+    this.msg = msg;
+    this.executorId = executorId;
+  }
+
+  public String executorId() {
+    return this.executorId;
+  }
+
+  public String msg() {
+    return this.msg;
+  }
+
+  @Override
+  public boolean equals(Object other) {
+    if (!(other instanceof ProfileStatusMsg)) {
+      return false;
+    }
+    // Objects.equals keeps both comparisons null-safe.
+    ProfileStatusMsg rhs = (ProfileStatusMsg) other;
+    return Objects.equals(msg, rhs.msg) && Objects.equals(executorId, rhs.executorId);
+  }
+
+  /** Hashes the same two fields that equals compares. */
+  @Override
+  public int hashCode() {
+    return Objects.hash(executorId, msg);
+  }
+
+  /** Renders as ProfileStatusMsg(executorId,msg). */
+  @Override
+  public String toString() {
+    return "ProfileStatusMsg(" + executorId + "," + msg + ")";
+  }
+}
diff --git a/sql-plugin/src/main/java/com/nvidia/spark/rapids/RapidsHostColumnBuilder.java b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/RapidsHostColumnBuilder.java
similarity index 99%
rename from sql-plugin/src/main/java/com/nvidia/spark/rapids/RapidsHostColumnBuilder.java
rename to sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/RapidsHostColumnBuilder.java
index ee4ee81a386..51ba9b62888 100644
--- a/sql-plugin/src/main/java/com/nvidia/spark/rapids/RapidsHostColumnBuilder.java
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/RapidsHostColumnBuilder.java
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2024-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2024-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
diff --git a/sql-plugin/src/main/java/com/nvidia/spark/rapids/RapidsHostColumnVector.java b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/RapidsHostColumnVector.java
similarity index 98%
rename from sql-plugin/src/main/java/com/nvidia/spark/rapids/RapidsHostColumnVector.java
rename to sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/RapidsHostColumnVector.java
index c7913cd93e5..eae18071639 100644
--- a/sql-plugin/src/main/java/com/nvidia/spark/rapids/RapidsHostColumnVector.java
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/RapidsHostColumnVector.java
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2020-2023, NVIDIA CORPORATION.
+ * Copyright (c) 2020-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
diff --git a/sql-plugin/src/main/java/com/nvidia/spark/rapids/RapidsHostColumnVectorCore.java b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/RapidsHostColumnVectorCore.java
similarity index 99%
rename from sql-plugin/src/main/java/com/nvidia/spark/rapids/RapidsHostColumnVectorCore.java
rename to sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/RapidsHostColumnVectorCore.java
index 87d92724e95..0f9900f1987 100644
--- a/sql-plugin/src/main/java/com/nvidia/spark/rapids/RapidsHostColumnVectorCore.java
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/RapidsHostColumnVectorCore.java
@@ -1,6 +1,6 @@
 
 /*
- * Copyright (c) 2020-2021, NVIDIA CORPORATION.
+ * Copyright (c) 2020-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
diff --git a/sql-plugin/src/main/java/com/nvidia/spark/rapids/RapidsNullSafeHostColumnVector.java b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/RapidsNullSafeHostColumnVector.java
similarity index 96%
rename from sql-plugin/src/main/java/com/nvidia/spark/rapids/RapidsNullSafeHostColumnVector.java
rename to sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/RapidsNullSafeHostColumnVector.java
index 1eb1b1f66d7..1f79dd19596 100644
--- a/sql-plugin/src/main/java/com/nvidia/spark/rapids/RapidsNullSafeHostColumnVector.java
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/RapidsNullSafeHostColumnVector.java
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2021, NVIDIA CORPORATION.
+ * Copyright (c) 2021-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
diff --git a/sql-plugin/src/main/java/com/nvidia/spark/rapids/RapidsNullSafeHostColumnVectorCore.java b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/RapidsNullSafeHostColumnVectorCore.java
similarity index 99%
rename from sql-plugin/src/main/java/com/nvidia/spark/rapids/RapidsNullSafeHostColumnVectorCore.java
rename to sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/RapidsNullSafeHostColumnVectorCore.java
index d35bc9b96c5..459bc5af7f7 100644
--- a/sql-plugin/src/main/java/com/nvidia/spark/rapids/RapidsNullSafeHostColumnVectorCore.java
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/RapidsNullSafeHostColumnVectorCore.java
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2021, NVIDIA CORPORATION.
+ * Copyright (c) 2021-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
diff --git a/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/ShuffleBufferId.java b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/ShuffleBufferId.java
new file mode 100644
index 00000000000..95b6d2d17d4
--- /dev/null
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/ShuffleBufferId.java
@@ -0,0 +1,77 @@
+/*
+ * Copyright (c) 2020-2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.nvidia.spark.rapids;
+
+import java.io.Serializable;
+import java.util.Objects;
+
+import org.apache.spark.storage.ShuffleBlockId;
+
+/** Identifier for a shuffle buffer that holds the data for a table. */
+public final class ShuffleBufferId implements Serializable {
+  private static final long serialVersionUID = 0L;
+
+  private final ShuffleBlockId blockId;
+  private final int tableId;
+  private final int shuffleId;
+  private final long mapId;
+
+  /** Also stores blockId's shuffleId and mapId; a null blockId raises NullPointerException. */
+  public ShuffleBufferId(ShuffleBlockId blockId, int tableId) {
+    this.shuffleId = blockId.shuffleId();
+    this.mapId = blockId.mapId();
+    this.blockId = blockId;
+    this.tableId = tableId;
+  }
+
+  public ShuffleBlockId blockId() {
+    return this.blockId;
+  }
+
+  public int tableId() {
+    return this.tableId;
+  }
+
+  public int shuffleId() {
+    return this.shuffleId;
+  }
+
+  public long mapId() {
+    return this.mapId;
+  }
+
+  /** Compares blockId and tableId only; shuffleId and mapId are derived from blockId. */
+  @Override
+  public boolean equals(Object other) {
+    if (!(other instanceof ShuffleBufferId)) {
+      return false;
+    }
+    ShuffleBufferId rhs = (ShuffleBufferId) other;
+    return tableId == rhs.tableId && Objects.equals(blockId, rhs.blockId);
+  }
+
+  /** Hashes the same two fields that equals compares. */
+  @Override
+  public int hashCode() {
+    return Objects.hash(blockId, tableId);
+  }
+
+  @Override
+  public String toString() {
+    return "ShuffleBufferId(" + blockId + "," + tableId + ")";
+  }
+}
diff --git a/sql-plugin/src/main/java/com/nvidia/spark/rapids/SlicedGpuColumnVector.java b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/SlicedGpuColumnVector.java
similarity index 99%
rename from sql-plugin/src/main/java/com/nvidia/spark/rapids/SlicedGpuColumnVector.java
rename to sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/SlicedGpuColumnVector.java
index 295eb182cd7..626a8bc6d14 100644
--- a/sql-plugin/src/main/java/com/nvidia/spark/rapids/SlicedGpuColumnVector.java
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/SlicedGpuColumnVector.java
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2019-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2019-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
diff --git a/sql-plugin/src/main/java/com/nvidia/spark/rapids/SlicedSerializedColumnVector.java b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/SlicedSerializedColumnVector.java
similarity index 98%
rename from sql-plugin/src/main/java/com/nvidia/spark/rapids/SlicedSerializedColumnVector.java
rename to sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/SlicedSerializedColumnVector.java
index b8f4be5cd76..9dae9f0523e 100644
--- a/sql-plugin/src/main/java/com/nvidia/spark/rapids/SlicedSerializedColumnVector.java
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/SlicedSerializedColumnVector.java
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2025, NVIDIA CORPORATION.
+ * Copyright (c) 2025-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
diff --git a/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/SpillPriorities.java b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/SpillPriorities.java
new file mode 100644
index 00000000000..10376cb7249
--- /dev/null
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/SpillPriorities.java
@@ -0,0 +1,66 @@
+/*
+ * Copyright (c) 2020-2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.nvidia.spark.rapids;
+
+/**
+ * Utility methods for managing spillable buffer priorities.
+ * The spill priority numerical space is divided into potentially overlapping ranges based on
+ * the type of buffer.
+ */
+public final class SpillPriorities {
+  /** Priority of task output buffers intended for shuffle: the minimum long value. */
+  public static final long OUTPUT_FOR_SHUFFLE_INITIAL_TASK_PRIORITY = Long.MIN_VALUE;
+
+  /**
+   * Priority of buffers received from shuffle. A task is about to read these buffers, so they
+   * should be spilled only as a last resort; 1000 values are left free above this one so that
+   * other priorities can still be ranked after it.
+   */
+  public static final long INPUT_FROM_SHUFFLE_PRIORITY = Long.MAX_VALUE - 1000;
+
+  /**
+   * Priority of data that is held while waiting for {@code next} to be called, i.e. between
+   * {@code hasNext} and {@code next} or between successive calls to {@code next}.
+   */
+  public static final long ACTIVE_ON_DECK_PRIORITY = INPUT_FROM_SHUFFLE_PRIORITY + 1;
+
+  /** Priority of the buffers accumulated during a single call to next. */
+  public static final long ACTIVE_BATCHING_PRIORITY = ACTIVE_ON_DECK_PRIORITY + 100;
+
+  /** Offset applied to the priority of host memory buffers for spilling. */
+  public static final long HOST_MEMORY_BUFFER_SPILL_OFFSET = 0;
+
+  private SpillPriorities() { // static members only
+  }
+
+  /**
+   * Adds an offset to a priority, saturating at the bounds of {@code long} instead of wrapping.
+   *
+   * @param originalPriority the priority to adjust
+   * @param offset the signed amount to add
+   * @return the sum, or Long.MIN_VALUE / Long.MAX_VALUE when the sum would overflow
+   */
+  public static long applyPriorityOffset(long originalPriority, long offset) {
+    if (offset > 0 && originalPriority > Long.MAX_VALUE - offset) {
+      return Long.MAX_VALUE;
+    }
+    if (offset < 0 && originalPriority < Long.MIN_VALUE - offset) {
+      return Long.MIN_VALUE;
+    }
+    return originalPriority + offset;
+  }
+}
diff --git a/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/TableCompressionCodecConfig.java b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/TableCompressionCodecConfig.java
new file mode 100644
index 00000000000..62fef8edbc3
--- /dev/null
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/TableCompressionCodecConfig.java
@@ -0,0 +1,65 @@
+/*
+ * Copyright (c) 2020-2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.nvidia.spark.rapids;
+
+import java.io.Serializable;
+import java.util.Objects;
+
+/** Immutable holder for the lz4 and zstd chunk-size settings of table compression. */
+public class TableCompressionCodecConfig implements Serializable {
+  private static final long serialVersionUID = 1L;
+
+  private final long lz4ChunkSize;
+  private final long zstdChunkSize;
+
+  public TableCompressionCodecConfig(long lz4ChunkSize, long zstdChunkSize) {
+    this.zstdChunkSize = zstdChunkSize;
+    this.lz4ChunkSize = lz4ChunkSize;
+  }
+
+  /** @return the lz4 chunk size supplied at construction */
+  public long lz4ChunkSize() {
+    return this.lz4ChunkSize;
+  }
+
+  /** @return the zstd chunk size supplied at construction */
+  public long zstdChunkSize() {
+    return this.zstdChunkSize;
+  }
+
+  @Override
+  public boolean equals(Object other) {
+    if (other == this) {
+      return true;
+    }
+    if (other instanceof TableCompressionCodecConfig) {
+      TableCompressionCodecConfig rhs = (TableCompressionCodecConfig) other;
+      return rhs.lz4ChunkSize == lz4ChunkSize && rhs.zstdChunkSize == zstdChunkSize;
+    }
+    return false;
+  }
+
+  @Override
+  public int hashCode() {
+    return Objects.hash(lz4ChunkSize, zstdChunkSize);
+  }
+
+  @Override
+  public String toString() {
+    return "TableCompressionCodecConfig(" + lz4ChunkSize + "," + zstdChunkSize + ")";
+  }
+}
diff --git a/sql-plugin/src/main/spark400/scala/com/nvidia/spark/rapids/shims/DateTimeUtilsShims.scala b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/ThreadPoolConf.java
similarity index 62%
rename from sql-plugin/src/main/spark400/scala/com/nvidia/spark/rapids/shims/DateTimeUtilsShims.scala
rename to sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/ThreadPoolConf.java
index 21254c4b39a..b2bed218f95 100644
--- a/sql-plugin/src/main/spark400/scala/com/nvidia/spark/rapids/shims/DateTimeUtilsShims.scala
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/ThreadPoolConf.java
@@ -14,18 +14,18 @@
  * limitations under the License.
  */
 
+package com.nvidia.spark.rapids;
 
-/*** spark-rapids-shim-json-lines
-{"spark": "400"}
-{"spark": "400db173"}
-{"spark": "401"}
-{"spark": "402"}
-{"spark": "411"}
-spark-rapids-shim-json-lines ***/
-package com.nvidia.spark.rapids.shims
+import java.io.Serializable;
 
-import org.apache.spark.sql.catalyst.util.SparkDateTimeUtils
+public interface ThreadPoolConf extends Serializable {
+  /**
+   * The maximum number of threads used by the thread pool, not necessarily the final number.
+   */
+  int maxThreadNumber();
 
-object DateTimeUtilsShims {
-  def currentTimestamp: Long = SparkDateTimeUtils.instantToMicros(java.time.Instant.now())
-}
\ No newline at end of file
+  /**
+   * Whether to create pools for each Spark stage, only for testing for now.
+   */
+  boolean stageLevelPool();
+}
diff --git a/sql-plugin/src/main/java/com/nvidia/spark/rapids/TypeConverter.java b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/TypeConverter.java
similarity index 100%
rename from sql-plugin/src/main/java/com/nvidia/spark/rapids/TypeConverter.java
rename to sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/TypeConverter.java
diff --git a/sql-plugin/src/main/java/com/nvidia/spark/rapids/WithTableBuffer.java b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/WithTableBuffer.java
similarity index 94%
rename from sql-plugin/src/main/java/com/nvidia/spark/rapids/WithTableBuffer.java
rename to sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/WithTableBuffer.java
index eb1e1db5397..54359b96240 100644
--- a/sql-plugin/src/main/java/com/nvidia/spark/rapids/WithTableBuffer.java
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/WithTableBuffer.java
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2021, NVIDIA CORPORATION.
+ * Copyright (c) 2021-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
diff --git a/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/io/async/AsyncMetrics.java b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/io/async/AsyncMetrics.java
new file mode 100644
index 00000000000..bea87901510
--- /dev/null
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/io/async/AsyncMetrics.java
@@ -0,0 +1,66 @@
+/*
+ * Copyright (c) 2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.nvidia.spark.rapids.io.async;
+
+import java.io.Serializable;
+import java.util.Objects;
+
+/** Immutable pair of timings (scheduleTimeMs, executionTimeMs) recorded for an async task. */
+public class AsyncMetrics implements Serializable {
+  private static final long serialVersionUID = 1L;
+
+  private final long scheduleTimeMs;
+  private final long executionTimeMs;
+
+  public AsyncMetrics(long scheduleTimeMs, long executionTimeMs) {
+    this.executionTimeMs = executionTimeMs;
+    this.scheduleTimeMs = scheduleTimeMs;
+  }
+
+  /** @return the schedule time supplied at construction */
+  public long scheduleTimeMs() {
+    return this.scheduleTimeMs;
+  }
+
+  /** @return the execution time supplied at construction */
+  public long executionTimeMs() {
+    return this.executionTimeMs;
+  }
+
+  @Override
+  public boolean equals(Object other) {
+    if (other == this) {
+      return true;
+    }
+    // Value equality: both timings must match.
+    if (other instanceof AsyncMetrics) {
+      AsyncMetrics rhs = (AsyncMetrics) other;
+      return rhs.scheduleTimeMs == scheduleTimeMs && rhs.executionTimeMs == executionTimeMs;
+    }
+    return false;
+  }
+
+  @Override
+  public int hashCode() {
+    return Objects.hash(scheduleTimeMs, executionTimeMs);
+  }
+
+  @Override
+  public String toString() {
+    return "AsyncMetrics(" + scheduleTimeMs + "," + executionTimeMs + ")";
+  }
+}
diff --git a/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/io/async/ThrottlingExecutorStats.java b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/io/async/ThrottlingExecutorStats.java
new file mode 100644
index 00000000000..40b86a6ad3e
--- /dev/null
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/io/async/ThrottlingExecutorStats.java
@@ -0,0 +1,71 @@
+/*
+ * Copyright (c) 2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.nvidia.spark.rapids.io.async;
+
+import java.io.Serializable;
+import java.util.Objects;
+
+/**
+ * Mutable throttling counters updated by ThrottlingExecutor. Every field is public and
+ * non-final, and all four participate in equals, hashCode and toString.
+ */
+public class ThrottlingExecutorStats implements Serializable {
+  private static final long serialVersionUID = 1L;
+
+  // Public and non-final so they can be updated in place; there are no accessors.
+  public int numTasksScheduled;
+  public long accumulatedThrottleTimeNs;
+  public long minThrottleTimeNs;
+  public long maxThrottleTimeNs;
+
+  public ThrottlingExecutorStats(int numTasksScheduled, long accumulatedThrottleTimeNs,
+      long minThrottleTimeNs, long maxThrottleTimeNs) {
+    this.numTasksScheduled = numTasksScheduled;
+    this.accumulatedThrottleTimeNs = accumulatedThrottleTimeNs;
+    this.minThrottleTimeNs = minThrottleTimeNs;
+    this.maxThrottleTimeNs = maxThrottleTimeNs;
+  }
+
+  @Override
+  public boolean equals(Object other) {
+    if (other == this) {
+      return true;
+    }
+    if (other instanceof ThrottlingExecutorStats) {
+      ThrottlingExecutorStats rhs = (ThrottlingExecutorStats) other;
+      return rhs.numTasksScheduled == numTasksScheduled
+          && rhs.accumulatedThrottleTimeNs == accumulatedThrottleTimeNs
+          && rhs.minThrottleTimeNs == minThrottleTimeNs
+          && rhs.maxThrottleTimeNs == maxThrottleTimeNs;
+    }
+    return false;
+  }
+
+  @Override
+  public int hashCode() {
+    // Computed from the current field values, so it changes whenever a counter is updated.
+    return Objects.hash(
+        numTasksScheduled, accumulatedThrottleTimeNs, minThrottleTimeNs, maxThrottleTimeNs);
+  }
+
+  @Override
+  public String toString() {
+    String counters = numTasksScheduled + "," + accumulatedThrottleTimeNs + ","
+        + minThrottleTimeNs + "," + maxThrottleTimeNs;
+    return "ThrottlingExecutorStats(" + counters + ")";
+  }
+}
diff --git a/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/shuffle/BlockRange.java b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/shuffle/BlockRange.java
new file mode 100644
index 00000000000..1dcc97b5165
--- /dev/null
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/shuffle/BlockRange.java
@@ -0,0 +1,81 @@
+/*
+ * Copyright (c) 2020-2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.nvidia.spark.rapids.shuffle;
+
+import java.util.Objects;
+
+/** Byte range for a block; construction requires rangeStart to be strictly below rangeEnd. */
+public final class BlockRange<T extends BlockWithSize> {
+  private final T block;
+  private final long rangeStart;
+  private final long rangeEnd;
+
+  public BlockRange(T block, long rangeStart, long rangeEnd) {
+    if (!(rangeStart < rangeEnd)) {
+      String bounds = rangeStart + " to " + rangeEnd;
+      throw new IllegalArgumentException(
+          "requirement failed: Instantiated a BlockRange with invalid boundaries: " + bounds);
+    }
+    this.block = block;
+    this.rangeStart = rangeStart;
+    this.rangeEnd = rangeEnd;
+  }
+
+  public T block() {
+    return this.block;
+  }
+
+  public long rangeStart() {
+    return this.rangeStart;
+  }
+
+  public long rangeEnd() {
+    return this.rangeEnd;
+  }
+
+  public long rangeSize() {
+    return rangeEnd - rangeStart;
+  }
+
+  public boolean isComplete() {
+    // Complete when the range ends exactly at the size the block reports.
+    return block.size() == rangeEnd;
+  }
+
+  @Override
+  public boolean equals(Object obj) {
+    if (obj == this) {
+      return true;
+    }
+    if (obj instanceof BlockRange) {
+      BlockRange<?> that = (BlockRange<?>) obj;
+      return that.rangeStart == rangeStart && that.rangeEnd == rangeEnd
+          && Objects.equals(block, that.block);
+    }
+    return false;
+  }
+
+  @Override
+  public int hashCode() {
+    return Objects.hash(block, rangeStart, rangeEnd);
+  }
+
+  @Override
+  public String toString() {
+    return "BlockRange(" + block + "," + rangeStart + "," + rangeEnd + ")";
+  }
+}
diff --git a/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/shuffle/BlockWithSize.java b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/shuffle/BlockWithSize.java
new file mode 100644
index 00000000000..312f8198fef
--- /dev/null
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/shuffle/BlockWithSize.java
@@ -0,0 +1,22 @@
+/*
+ * Copyright (c) 2020-2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.nvidia.spark.rapids.shuffle;
+
+/** Block-like value that can report its size in bytes; the type bound used by BlockRange. */
+public interface BlockWithSize {
+  long size(); // size of this block, in bytes
+}
diff --git a/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/shuffle/TransactionStats.java b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/shuffle/TransactionStats.java
new file mode 100644
index 00000000000..75f4a0cef6e
--- /dev/null
+++ b/sql-plugin-columnar/src/main/java/com/nvidia/spark/rapids/shuffle/TransactionStats.java
@@ -0,0 +1,84 @@
+/*
+ * Copyright (c) 2020-2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.nvidia.spark.rapids.shuffle;
+
+import java.util.Objects;
+
+/** Immutable timing, size and throughput figures for one shuffle transaction. */
+public final class TransactionStats {
+  private final double txTimeMs;
+  private final long sendSize;
+  private final long receiveSize;
+  private final double sendThroughput;
+  private final double recvThroughput;
+
+  public TransactionStats(double txTimeMs, long sendSize, long receiveSize,
+      double sendThroughput, double recvThroughput) {
+    this.recvThroughput = recvThroughput;
+    this.sendThroughput = sendThroughput;
+    this.receiveSize = receiveSize;
+    this.sendSize = sendSize;
+    this.txTimeMs = txTimeMs;
+  }
+
+  public double txTimeMs() {
+    return this.txTimeMs;
+  }
+
+  public long sendSize() {
+    return this.sendSize;
+  }
+
+  public long receiveSize() {
+    return this.receiveSize;
+  }
+
+  public double sendThroughput() {
+    return this.sendThroughput;
+  }
+
+  public double recvThroughput() {
+    return this.recvThroughput;
+  }
+
+  @Override
+  public boolean equals(Object obj) {
+    if (obj == this) {
+      return true;
+    }
+    if (obj instanceof TransactionStats) {
+      TransactionStats that = (TransactionStats) obj;
+      return that.sendSize == sendSize
+          && that.receiveSize == receiveSize
+          && Double.compare(txTimeMs, that.txTimeMs) == 0
+          && Double.compare(sendThroughput, that.sendThroughput) == 0
+          && Double.compare(recvThroughput, that.recvThroughput) == 0;
+    }
+    return false;
+  }
+
+  @Override
+  public int hashCode() {
+    return Objects.hash(txTimeMs, sendSize, receiveSize, sendThroughput, recvThroughput);
+  }
+
+  @Override
+  public String toString() {
+    String tail = sendSize + "," + receiveSize + "," + sendThroughput + "," + recvThroughput;
+    return "TransactionStats(" + txTimeMs + "," + tail + ")";
+  }
+}
diff --git a/sql-plugin-columnar/src/main/java/org/apache/spark/sql/rapids/BasicColumnarWriteTaskStats.java b/sql-plugin-columnar/src/main/java/org/apache/spark/sql/rapids/BasicColumnarWriteTaskStats.java
new file mode 100644
index 00000000000..7579ea33958
--- /dev/null
+++ b/sql-plugin-columnar/src/main/java/org/apache/spark/sql/rapids/BasicColumnarWriteTaskStats.java
@@ -0,0 +1,98 @@
+/*
+ * Copyright (c) 2019-2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.spark.sql.rapids;
+
+import java.util.Objects;
+
+import org.apache.spark.sql.catalyst.InternalRow;
+import org.apache.spark.sql.execution.datasources.WriteTaskStats;
+
+import scala.collection.Seq;
+
+/**
+ * Simple metrics collected during an instance of GpuFileFormatDataWriter: a sequence of
+ * partition rows plus file, writer, byte and row counts. All fields are final.
+ * These were first introduced in https://github.com/apache/spark/pull/18159 (SPARK-20703).
+ */
+public final class BasicColumnarWriteTaskStats implements WriteTaskStats {
+  private static final long serialVersionUID = 0L;
+
+  private final Seq<InternalRow> partitions;
+  private final int numFiles;
+  private final int numWriters;
+  private final long numBytes;
+  private final long numRows;
+
+  public BasicColumnarWriteTaskStats(
+      Seq<InternalRow> partitions, int numFiles, int numWriters,
+      long numBytes, long numRows) {
+    this.partitions = partitions;
+    this.numFiles = numFiles;
+    this.numWriters = numWriters;
+    this.numBytes = numBytes;
+    this.numRows = numRows;
+  }
+
+  public Seq<InternalRow> partitions() {
+    return this.partitions;
+  }
+
+  public int numFiles() {
+    return this.numFiles;
+  }
+
+  public int numWriters() {
+    return this.numWriters;
+  }
+
+  public long numBytes() {
+    return this.numBytes;
+  }
+
+  public long numRows() {
+    return this.numRows;
+  }
+
+  @Override
+  public boolean equals(Object other) {
+    if (other == this) {
+      return true;
+    }
+    // The primitive counters are compared first; the partitions sequence is compared last.
+    if (other instanceof BasicColumnarWriteTaskStats) {
+      BasicColumnarWriteTaskStats rhs = (BasicColumnarWriteTaskStats) other;
+      return rhs.numFiles == numFiles
+          && rhs.numWriters == numWriters
+          && rhs.numBytes == numBytes
+          && rhs.numRows == numRows
+          && Objects.equals(partitions, rhs.partitions);
+    }
+    return false;
+  }
+
+  @Override
+  public int hashCode() {
+    // Hashes the same five fields that equals compares.
+    return Objects.hash(partitions, numFiles, numWriters, numBytes, numRows);
+  }
+
+  @Override
+  public String toString() {
+    String counts = numFiles + "," + numWriters + "," + numBytes + "," + numRows;
+    return "BasicColumnarWriteTaskStats(" + partitions + "," + counts + ")";
+  }
+}
diff --git a/sql-plugin-columnar/src/main/java/org/apache/spark/sql/rapids/NanoTime.java b/sql-plugin-columnar/src/main/java/org/apache/spark/sql/rapids/NanoTime.java
new file mode 100644
index 00000000000..d862ae90372
--- /dev/null
+++ b/sql-plugin-columnar/src/main/java/org/apache/spark/sql/rapids/NanoTime.java
@@ -0,0 +1,63 @@
+/*
+ * Copyright (c) 2023-2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.spark.sql.rapids;
+
+import java.io.Serializable;
+import java.util.Locale;
+import java.util.Objects;
+import java.util.concurrent.TimeUnit;
+
+public final class NanoTime implements Serializable {
+  private static final long serialVersionUID = 1L;
+
+  private final Long value;
+
+  public NanoTime(Long value) {
+    this.value = value;
+  }
+
+  public Long value() {
+    return this.value;
+  }
+
+  @Override
+  public String toString() {
+    // Split into whole hours, whole minutes and fractional seconds: HH:MM:SS.mmm.
+    final long total = value;
+    final long hours = TimeUnit.NANOSECONDS.toHours(total);
+    final long afterHours = total - TimeUnit.HOURS.toNanos(hours);
+    final long minutes = TimeUnit.NANOSECONDS.toMinutes(afterHours);
+    final double seconds = (afterHours - TimeUnit.MINUTES.toNanos(minutes)) / 1.0e9;
+    return String.format(Locale.US, "%02d:%02d:%06.3f", hours, minutes, seconds);
+  }
+
+  @Override
+  public boolean equals(Object obj) {
+    if (obj == this) {
+      return true;
+    }
+    if (obj instanceof NanoTime) {
+      return Objects.equals(value, ((NanoTime) obj).value);
+    }
+    return false;
+  }
+
+  @Override
+  public int hashCode() {
+    return Objects.hash(value);
+  }
+}
diff --git a/sql-plugin-columnar/src/main/java/org/apache/spark/sql/rapids/SizeInBytes.java b/sql-plugin-columnar/src/main/java/org/apache/spark/sql/rapids/SizeInBytes.java
new file mode 100644
index 00000000000..7fb6c83f5e8
--- /dev/null
+++ b/sql-plugin-columnar/src/main/java/org/apache/spark/sql/rapids/SizeInBytes.java
@@ -0,0 +1,68 @@
+/*
+ * Copyright (c) 2023-2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.spark.sql.rapids;
+
+import java.io.Serializable;
+import java.util.Objects;
+
+/** Byte count whose toString renders a scaled value with a unit suffix plus the raw bytes. */
+public final class SizeInBytes implements Serializable {
+  private static final long serialVersionUID = 1L;
+
+  private static final String[] SIZE_UNIT_NAMES = {"B", "KB", "MB", "GB", "TB", "PB", "EB"};
+
+  private final Long value;
+
+  public SizeInBytes(Long value) {
+    this.value = value;
+  }
+
+  public Long value() {
+    return value;
+  }
+
+  @Override
+  public String toString() {
+    long unitVal = value;
+    long remainVal = 0;
+    int unitIndex = 0;
+    while (unitIndex < SIZE_UNIT_NAMES.length - 1 && unitVal >= 1024) { // stay within the names
+      remainVal = unitVal & 1023;
+      unitVal >>= 10;
+      unitIndex += 1;
+    }
+    // Locale.US pins '.' as the decimal separator regardless of the JVM default locale.
+    String finalVal = String.format(java.util.Locale.US, "%.2f", unitVal + (remainVal / 1024.0));
+    return finalVal + SIZE_UNIT_NAMES[unitIndex] + " (" + value + " bytes)";
+  }
+
+  @Override
+  public boolean equals(Object obj) {
+    if (this == obj) {
+      return true;
+    }
+    if (obj instanceof SizeInBytes) {
+      return Objects.equals(value, ((SizeInBytes) obj).value);
+    }
+    return false;
+  }
+
+  @Override
+  public int hashCode() {
+    return Objects.hash(value);
+  }
+}
diff --git a/sql-plugin-columnar/src/main/java/org/apache/spark/sql/rapids/execution/JoinCardinalityStats.java b/sql-plugin-columnar/src/main/java/org/apache/spark/sql/rapids/execution/JoinCardinalityStats.java
new file mode 100644
index 00000000000..8cd8a0c4cfc
--- /dev/null
+++ b/sql-plugin-columnar/src/main/java/org/apache/spark/sql/rapids/execution/JoinCardinalityStats.java
@@ -0,0 +1,128 @@
+/*
+ * Copyright (c) 2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.spark.sql.rapids.execution;
+
+import java.io.Serializable;
+import java.util.Objects;
+
+import org.apache.spark.sql.types.DataType;
+
+import scala.collection.Seq;
+
+/**
+ * Statistics for join cardinality logging to help diagnose performance issues. Holds row and
+ * distinct counts plus null-count and key-type sequences for the left and right sides.
+ */
+public final class JoinCardinalityStats implements Serializable {
+  private static final long serialVersionUID = 0L;
+
+  // Row and distinct counts, one per side.
+  private final long leftRowCount;
+  private final long rightRowCount;
+  private final long leftDistinctCount;
+  private final long rightDistinctCount;
+  // Null counts, one sequence per side; the element type is left open here.
+  private final Seq<?> leftNullCounts;
+  private final Seq<?> rightNullCounts;
+  // Key data types, one sequence per side.
+  private final Seq<DataType> leftKeyTypes;
+  private final Seq<DataType> rightKeyTypes;
+
+  public JoinCardinalityStats(
+      long leftRowCount, long rightRowCount,
+      long leftDistinctCount, long rightDistinctCount,
+      Seq<?> leftNullCounts, Seq<?> rightNullCounts,
+      Seq<DataType> leftKeyTypes, Seq<DataType> rightKeyTypes) {
+    this.leftRowCount = leftRowCount;
+    this.rightRowCount = rightRowCount;
+    this.leftDistinctCount = leftDistinctCount;
+    this.rightDistinctCount = rightDistinctCount;
+    this.leftNullCounts = leftNullCounts;
+    this.rightNullCounts = rightNullCounts;
+    this.leftKeyTypes = leftKeyTypes;
+    this.rightKeyTypes = rightKeyTypes;
+  }
+
+  public long leftRowCount() {
+    return this.leftRowCount;
+  }
+
+  public long rightRowCount() {
+    return this.rightRowCount;
+  }
+
+  public long leftDistinctCount() {
+    return this.leftDistinctCount;
+  }
+
+  public long rightDistinctCount() {
+    return this.rightDistinctCount;
+  }
+
+  public Seq<?> leftNullCounts() {
+    return this.leftNullCounts;
+  }
+
+  public Seq<?> rightNullCounts() {
+    return this.rightNullCounts;
+  }
+
+  public Seq<DataType> leftKeyTypes() {
+    return this.leftKeyTypes;
+  }
+
+  public Seq<DataType> rightKeyTypes() {
+    return this.rightKeyTypes;
+  }
+
+  @Override
+  public boolean equals(Object other) {
+    if (other == this) {
+      return true;
+    }
+    // The primitive counts are compared before the sequence-valued fields.
+    if (other instanceof JoinCardinalityStats) {
+      JoinCardinalityStats rhs = (JoinCardinalityStats) other;
+      return rhs.leftRowCount == leftRowCount
+          && rhs.rightRowCount == rightRowCount
+          && rhs.leftDistinctCount == leftDistinctCount
+          && rhs.rightDistinctCount == rightDistinctCount
+          && Objects.equals(leftNullCounts, rhs.leftNullCounts)
+          && Objects.equals(rightNullCounts, rhs.rightNullCounts)
+          && Objects.equals(leftKeyTypes, rhs.leftKeyTypes)
+          && Objects.equals(rightKeyTypes, rhs.rightKeyTypes);
+    }
+    return false;
+  }
+
+  @Override
+  public int hashCode() {
+    // Hashes the same eight fields that equals compares, in declaration order.
+    return Objects.hash(
+        leftRowCount, rightRowCount, leftDistinctCount, rightDistinctCount,
+        leftNullCounts, rightNullCounts, leftKeyTypes, rightKeyTypes);
+  }
+
+  @Override
+  public String toString() {
+    String rows = leftRowCount + "," + rightRowCount;
+    String distinct = leftDistinctCount + "," + rightDistinctCount;
+    String nulls = leftNullCounts + "," + rightNullCounts;
+    String keys = leftKeyTypes + "," + rightKeyTypes;
+    return "JoinCardinalityStats(" + rows + "," + distinct + "," + nulls + "," + keys + ")";
+  }
+}
diff --git a/sql-plugin-columnar/src/main/java/org/apache/spark/sql/rapids/execution/JoinOptions.java b/sql-plugin-columnar/src/main/java/org/apache/spark/sql/rapids/execution/JoinOptions.java
new file mode 100644
index 00000000000..be0487ecde7
--- /dev/null
+++ b/sql-plugin-columnar/src/main/java/org/apache/spark/sql/rapids/execution/JoinOptions.java
@@ -0,0 +1,94 @@
+/*
+ * Copyright (c) 2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.spark.sql.rapids.execution;
+
+import java.io.Serializable;
+import java.util.Objects;
+
+import scala.Enumeration.Value;
+
+/**
+ * Options to control join behavior: two enumeration-valued choices (strategy and build-side
+ * selection), a target size, a cardinality-logging flag and a size-estimate threshold.
+ */
+public final class JoinOptions implements Serializable {
+  private static final long serialVersionUID = 0L;
+
+  private final Value strategy;
+  private final Value buildSideSelection;
+  private final long targetSize;
+  private final boolean logCardinalityEnabled;
+  private final double sizeEstimateThreshold;
+
+  public JoinOptions(Value strategy, Value buildSideSelection, long targetSize,
+      boolean logCardinalityEnabled, double sizeEstimateThreshold) {
+    this.strategy = strategy;
+    this.buildSideSelection = buildSideSelection;
+    this.targetSize = targetSize;
+    this.logCardinalityEnabled = logCardinalityEnabled;
+    this.sizeEstimateThreshold = sizeEstimateThreshold;
+  }
+
+  public Value strategy() {
+    return this.strategy;
+  }
+
+  public Value buildSideSelection() {
+    return this.buildSideSelection;
+  }
+
+  public long targetSize() {
+    return this.targetSize;
+  }
+
+  public boolean logCardinalityEnabled() {
+    return this.logCardinalityEnabled;
+  }
+
+  public double sizeEstimateThreshold() {
+    return this.sizeEstimateThreshold;
+  }
+
+  @Override
+  public boolean equals(Object other) {
+    if (other == this) {
+      return true;
+    }
+    if (other instanceof JoinOptions) {
+      JoinOptions rhs = (JoinOptions) other;
+      return rhs.targetSize == targetSize
+          && rhs.logCardinalityEnabled == logCardinalityEnabled
+          && Double.compare(sizeEstimateThreshold, rhs.sizeEstimateThreshold) == 0
+          && Objects.equals(strategy, rhs.strategy)
+          && Objects.equals(buildSideSelection, rhs.buildSideSelection);
+    }
+    return false;
+  }
+
+  @Override
+  public int hashCode() {
+    return Objects.hash(
+        strategy, buildSideSelection, targetSize, logCardinalityEnabled, sizeEstimateThreshold);
+  }
+
+  @Override
+  public String toString() {
+    String selection = strategy + "," + buildSideSelection;
+    String tuning = targetSize + "," + logCardinalityEnabled + "," + sizeEstimateThreshold;
+    return "JoinOptions(" + selection + "," + tuning + ")";
+  }
+}
diff --git a/sql-plugin/src/main/java/org/apache/spark/sql/vectorized/rapids/AccessibleArrowColumnVector.java b/sql-plugin-columnar/src/main/java/org/apache/spark/sql/vectorized/rapids/AccessibleArrowColumnVector.java
similarity index 99%
rename from sql-plugin/src/main/java/org/apache/spark/sql/vectorized/rapids/AccessibleArrowColumnVector.java
rename to sql-plugin-columnar/src/main/java/org/apache/spark/sql/vectorized/rapids/AccessibleArrowColumnVector.java
index 514f11316af..78fb986b307 100644
--- a/sql-plugin/src/main/java/org/apache/spark/sql/vectorized/rapids/AccessibleArrowColumnVector.java
+++ b/sql-plugin-columnar/src/main/java/org/apache/spark/sql/vectorized/rapids/AccessibleArrowColumnVector.java
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2021, NVIDIA CORPORATION.
+ * Copyright (c) 2021-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
diff --git a/sql-plugin-fileio/pom.xml b/sql-plugin-fileio/pom.xml
new file mode 100644
index 00000000000..e45d88fa79e
--- /dev/null
+++ b/sql-plugin-fileio/pom.xml
@@ -0,0 +1,118 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!--
+  Copyright (c) 2026, NVIDIA CORPORATION.
+
+  Licensed under the Apache License, Version 2.0 (the "License");
+  you may not use this file except in compliance with the License.
+  You may obtain a copy of the License at
+
+     http://www.apache.org/licenses/LICENSE-2.0
+
+  Unless required by applicable law or agreed to in writing, software
+  distributed under the License is distributed on an "AS IS" BASIS,
+  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+  See the License for the specific language governing permissions and
+  limitations under the License.
+-->
+<project xmlns="http://maven.apache.org/POM/4.0.0"
+         xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
+         xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/xsd/maven-4.0.0.xsd">
+    <modelVersion>4.0.0</modelVersion>
+
+    <parent>
+        <groupId>com.nvidia</groupId>
+        <artifactId>rapids-4-spark-shim-deps-parent_2.12</artifactId>
+        <version>26.08.0-SNAPSHOT</version>
+        <relativePath>../shim-deps/pom.xml</relativePath>
+    </parent>
+
+    <artifactId>rapids-4-spark-sql-plugin-fileio_2.12</artifactId>
+    <description>Java-only file I/O runtime plumbing for the RAPIDS SQL plugin</description>
+    <version>26.08.0-SNAPSHOT</version>
+
+    <properties>
+        <rapids.module>sql-plugin-fileio</rapids.module>
+        <rapids.compressed.artifact>false</rapids.compressed.artifact>
+        <rapids.default.jar.excludePattern>**/*</rapids.default.jar.excludePattern>
+        <rapids.shim.jar.phase>package</rapids.shim.jar.phase>
+        <rapids.shimplify.skip>true</rapids.shimplify.skip>
+    </properties>
+
+    <dependencies>
+        <dependency>
+            <groupId>com.nvidia</groupId>
+            <artifactId>spark-rapids-jni</artifactId>
+            <classifier>${jni.classifier}</classifier>
+        </dependency>
+        <dependency>
+            <groupId>org.apache.spark</groupId>
+            <artifactId>spark-core_${scala.binary.version}</artifactId>
+            <version>${spark.version}</version>
+            <scope>provided</scope>
+        </dependency>
+    </dependencies>
+
+    <build>
+        <plugins>
+            <plugin>
+                <groupId>org.apache.maven.plugins</groupId>
+                <artifactId>maven-compiler-plugin</artifactId>
+                <executions>
+                    <execution>
+                        <id>default-compile</id>
+                        <phase>compile</phase>
+                        <goals>
+                            <goal>compile</goal>
+                        </goals>
+                    </execution>
+                    <execution>
+                        <id>default-testCompile</id>
+                        <phase>test-compile</phase>
+                        <goals>
+                            <goal>testCompile</goal>
+                        </goals>
+                    </execution>
+                </executions>
+                <configuration>
+                    <release>${java.major.version}</release>
+                    <compilerArgs>
+                        <arg>-Xlint:all,-serial,-path,-try,-processing</arg>
+                    </compilerArgs>
+                </configuration>
+            </plugin>
+            <plugin>
+                <groupId>net.alchim31.maven</groupId>
+                <artifactId>scala-maven-plugin</artifactId>
+                <executions>
+                    <execution>
+                        <id>eclipse-add-source</id>
+                        <phase>none</phase>
+                    </execution>
+                    <execution>
+                        <id>scala-compile-first</id>
+                        <phase>none</phase>
+                    </execution>
+                    <execution>
+                        <id>scala-test-compile-first</id>
+                        <phase>none</phase>
+                    </execution>
+                    <execution>
+                        <id>attach-scaladocs</id>
+                        <phase>none</phase>
+                    </execution>
+                </executions>
+            </plugin>
+            <plugin>
+                <groupId>org.apache.rat</groupId>
+                <artifactId>apache-rat-plugin</artifactId>
+            </plugin>
+            <plugin>
+                <groupId>org.apache.maven.plugins</groupId>
+                <artifactId>maven-surefire-plugin</artifactId>
+                <configuration>
+                    <skipTests>true</skipTests>
+                </configuration>
+            </plugin>
+        </plugins>
+    </build>
+</project>
diff --git a/sql-plugin-fileio/src/main/java/com/nvidia/spark/rapids/FileUtils.java b/sql-plugin-fileio/src/main/java/com/nvidia/spark/rapids/FileUtils.java
new file mode 100644
index 00000000000..06059b11e50
--- /dev/null
+++ b/sql-plugin-fileio/src/main/java/com/nvidia/spark/rapids/FileUtils.java
@@ -0,0 +1,65 @@
+/*
+ * Copyright (c) 2019-2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.nvidia.spark.rapids;
+
+import java.io.IOException;
+import java.util.Random;
+
+import org.apache.hadoop.conf.Configuration;
+import org.apache.hadoop.fs.FSDataOutputStream;
+import org.apache.hadoop.fs.FileAlreadyExistsException;
+import org.apache.hadoop.fs.FileSystem;
+import org.apache.hadoop.fs.Path;
+
+/** Static helpers for creating uniquely named files on a Hadoop {@link FileSystem}. */
+public final class FileUtils {
+  private FileUtils() {}
+
+  /** Pairs the path of a newly created temporary file with the stream opened on it. */
+  public static final class TempFile {
+    private final Path path;
+    private final FSDataOutputStream outputStream;
+
+    TempFile(FSDataOutputStream outputStream, Path path) {
+      this.path = path;
+      this.outputStream = outputStream;
+    }
+
+    public FSDataOutputStream getOutputStream() { return outputStream; }
+
+    public Path getPath() { return path; }
+  }
+
+  /** Creates a new file named prefix + random int + suffix, retrying while the name is taken. */
+  public static TempFile createTempFile(
+      Configuration conf, String pathPrefix, String pathSuffix) throws IOException {
+    final FileSystem fileSystem = new Path(pathPrefix).getFileSystem(conf);
+    final Random random = new Random();
+    final String tail = pathSuffix == null ? "" : pathSuffix; // null means "no suffix"
+    for (;;) {
+      Path candidate = new Path(pathPrefix + random.nextInt(Integer.MAX_VALUE) + tail);
+      if (fileSystem.exists(candidate)) {
+        continue;
+      }
+      try {
+        return new TempFile(fileSystem.create(candidate, false), candidate);
+      } catch (FileAlreadyExistsException raceLost) {
+        // Another writer created the file between exists() and create(); try a new name.
+      }
+    }
+  }
+}
diff --git a/sql-plugin-fileio/src/main/java/com/nvidia/spark/rapids/fileio/RapidsInputFiles.java b/sql-plugin-fileio/src/main/java/com/nvidia/spark/rapids/fileio/RapidsInputFiles.java
new file mode 100644
index 00000000000..407bdd03fa6
--- /dev/null
+++ b/sql-plugin-fileio/src/main/java/com/nvidia/spark/rapids/fileio/RapidsInputFiles.java
@@ -0,0 +1,116 @@
+/*
+ * Copyright (c) 2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.nvidia.spark.rapids.fileio;
+
+import ai.rapids.cudf.HostMemoryBuffer;
+import com.nvidia.spark.rapids.jni.fileio.RapidsInputFile;
+import org.apache.hadoop.conf.Configuration;
+
+import java.io.IOException;
+import java.net.URI;
+import java.util.List;
+import java.util.Objects;
+
+/**
+ * Shared static helpers for {@link RapidsInputFile} implementations, built around a
+ * replaceable {@link S3PerfReader} that is disabled until one is registered.
+ */
+public final class RapidsInputFiles {
+    private RapidsInputFiles() {}
+
+    /**
+     * Java bridge for S3 PerfIO integration. The implementation lives in sql-plugin
+     * because it depends on private Scala PerfIO state.
+     */
+    public interface S3PerfReader {
+        boolean isEnabled();
+
+        boolean readVectored(Configuration hadoopConf, URI fileUri, HostMemoryBuffer output,
+                List<RapidsInputFile.CopyRange> copyRanges) throws IOException;
+
+        boolean readTail(Configuration hadoopConf, URI fileUri, HostMemoryBuffer output,
+                long length, long outputOffset) throws IOException;
+    }
+
+    /**
+     * Reader in effect while no bridge is registered: it reports itself disabled and
+     * answers false to every read request without touching its arguments.
+     */
+    private static final S3PerfReader DISABLED_S3_PERF_READER = new S3PerfReader() {
+        @Override
+        public boolean isEnabled() {
+            return false;
+        }
+
+        @Override
+        public boolean readVectored(Configuration hadoopConf, URI fileUri,
+                HostMemoryBuffer output, List<RapidsInputFile.CopyRange> copyRanges) {
+            return false;
+        }
+
+        @Override
+        public boolean readTail(Configuration hadoopConf, URI fileUri,
+                HostMemoryBuffer output, long length, long outputOffset) {
+            return false;
+        }
+    };
+
+    /** Active reader; volatile so every caller reads the most recently installed one. */
+    private static volatile S3PerfReader s3PerfReader = DISABLED_S3_PERF_READER;
+
+    /** Installs {@code reader} as the active bridge; a null reader is rejected. */
+    public static void setS3PerfReader(S3PerfReader reader) {
+        Objects.requireNonNull(reader, "reader can't be null");
+        s3PerfReader = reader;
+    }
+
+    /** Puts the disabled default reader back in place. */
+    public static void resetS3PerfReader() {
+        s3PerfReader = DISABLED_S3_PERF_READER;
+    }
+
+    /**
+     * True iff the active reader reports the S3 PerfIO path as enabled. Before any
+     * bridge is registered the disabled default answers false, so callers stay on the
+     * non-PerfIO path during early bring-up.
+     */
+    public static boolean isS3PerfEnabled() {
+        final S3PerfReader active = s3PerfReader;
+        return active.isEnabled();
+    }
+
+    /** Hands a vectored read to the active reader and returns its answer. */
+    public static boolean readS3Vectored(
+            Configuration hadoopConf,
+            URI fileUri,
+            HostMemoryBuffer output,
+            List<RapidsInputFile.CopyRange> copyRanges) throws IOException {
+        final S3PerfReader active = s3PerfReader;
+        return active.readVectored(hadoopConf, fileUri, output, copyRanges);
+    }
+
+    /** Hands a tail read to the active reader and returns its answer. */
+    public static boolean readS3Tail(
+            Configuration hadoopConf,
+            URI fileUri,
+            HostMemoryBuffer output,
+            long length,
+            long outputOffset) throws IOException {
+        final S3PerfReader active = s3PerfReader;
+        return active.readTail(hadoopConf, fileUri, output, length, outputOffset);
+    }
+}
diff --git a/sql-plugin/src/main/java/com/nvidia/spark/rapids/fileio/hadoop/HadoopFileIO.java b/sql-plugin-fileio/src/main/java/com/nvidia/spark/rapids/fileio/hadoop/HadoopFileIO.java
similarity index 75%
rename from sql-plugin/src/main/java/com/nvidia/spark/rapids/fileio/hadoop/HadoopFileIO.java
rename to sql-plugin-fileio/src/main/java/com/nvidia/spark/rapids/fileio/hadoop/HadoopFileIO.java
index dd9da173280..f17730211a7 100644
--- a/sql-plugin/src/main/java/com/nvidia/spark/rapids/fileio/hadoop/HadoopFileIO.java
+++ b/sql-plugin-fileio/src/main/java/com/nvidia/spark/rapids/fileio/hadoop/HadoopFileIO.java
@@ -16,12 +16,10 @@
 
 package com.nvidia.spark.rapids.fileio.hadoop;
 
-import com.nvidia.spark.rapids.fileio.RapidsInputFiles;
 import com.nvidia.spark.rapids.jni.fileio.RapidsFileIO;
 import com.nvidia.spark.rapids.jni.fileio.RapidsInputFile;
 import com.nvidia.spark.rapids.jni.fileio.RapidsOutputFile;
 import org.apache.hadoop.conf.Configuration;
-import org.apache.hadoop.fs.FileSystem;
 import org.apache.hadoop.fs.Path;
 import org.apache.spark.util.SerializableConfiguration;
 
@@ -34,9 +32,18 @@
  */
 public class HadoopFileIO implements RapidsFileIO {
     private final SerializableConfiguration hadoopConf;
+    private final HadoopInputFileFactory inputFileFactory;
 
     public HadoopFileIO(Configuration hadoopConf) {
         Objects.requireNonNull(hadoopConf, "hadoopConf can't be null");
+        this.inputFileFactory = null;
+        this.hadoopConf = new SerializableConfiguration(hadoopConf);
+    }
+
+    public HadoopFileIO(Configuration hadoopConf, HadoopInputFileFactory inputFileFactory) {
+        Objects.requireNonNull(hadoopConf, "hadoopConf can't be null");
+        this.inputFileFactory = Objects.requireNonNull(
+                inputFileFactory, "inputFileFactory can't be null");
         this.hadoopConf = new SerializableConfiguration(hadoopConf);
     }
 
@@ -47,9 +54,9 @@ public RapidsInputFile newInputFile(String path) throws IOException {
 
     @Override
     public RapidsInputFile newInputFile(Path path) throws IOException {
-        String scheme = path.toUri().getScheme();
-        if (scheme != null && scheme.startsWith("s3") && RapidsInputFiles.isS3PerfEnabled()) {
-            return S3InputFile.create(path, hadoopConf.value());
+        Objects.requireNonNull(path, "path can't be null");
+        if (inputFileFactory != null) {
+            return inputFileFactory.create(path, hadoopConf.value());
         }
         return HadoopInputFile.create(path, hadoopConf.value());
     }
diff --git a/sql-plugin/src/main/java/com/nvidia/spark/rapids/fileio/hadoop/HadoopInputFile.java b/sql-plugin-fileio/src/main/java/com/nvidia/spark/rapids/fileio/hadoop/HadoopInputFile.java
similarity index 98%
rename from sql-plugin/src/main/java/com/nvidia/spark/rapids/fileio/hadoop/HadoopInputFile.java
rename to sql-plugin-fileio/src/main/java/com/nvidia/spark/rapids/fileio/hadoop/HadoopInputFile.java
index a1688b50be3..25ab03e2a7b 100644
--- a/sql-plugin/src/main/java/com/nvidia/spark/rapids/fileio/hadoop/HadoopInputFile.java
+++ b/sql-plugin-fileio/src/main/java/com/nvidia/spark/rapids/fileio/hadoop/HadoopInputFile.java
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2025, NVIDIA CORPORATION.
+ * Copyright (c) 2025-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
diff --git a/sql-plugin/src/main/spark400/scala/com/nvidia/spark/rapids/shims/ReplaceDataExecShim.scala b/sql-plugin-fileio/src/main/java/com/nvidia/spark/rapids/fileio/hadoop/HadoopInputFileFactory.java
similarity index 50%
rename from sql-plugin/src/main/spark400/scala/com/nvidia/spark/rapids/shims/ReplaceDataExecShim.scala
rename to sql-plugin-fileio/src/main/java/com/nvidia/spark/rapids/fileio/hadoop/HadoopInputFileFactory.java
index e361720f76a..972a2ce103c 100644
--- a/sql-plugin/src/main/spark400/scala/com/nvidia/spark/rapids/shims/ReplaceDataExecShim.scala
+++ b/sql-plugin-fileio/src/main/java/com/nvidia/spark/rapids/fileio/hadoop/HadoopInputFileFactory.java
@@ -13,24 +13,21 @@
  * See the License for the specific language governing permissions and
  * limitations under the License.
  */
-/*** spark-rapids-shim-json-lines
-{"spark": "400"}
-{"spark": "401"}
-{"spark": "402"}
-{"spark": "411"}
-spark-rapids-shim-json-lines ***/
-package com.nvidia.spark.rapids.shims
 
-import com.nvidia.spark.rapids.{GpuExec, GpuWrite}
+package com.nvidia.spark.rapids.fileio.hadoop;
 
-import org.apache.spark.sql.execution.SparkPlan
-import org.apache.spark.sql.execution.datasources.v2.{GpuReplaceDataExec, ReplaceDataExec}
+import com.nvidia.spark.rapids.jni.fileio.RapidsInputFile;
+import org.apache.hadoop.conf.Configuration;
+import org.apache.hadoop.fs.Path;
 
-object ReplaceDataExecShim {
-  def convertToGpu(
-      cpuExec: ReplaceDataExec,
-      childPlan: SparkPlan,
-      gpuWrite: GpuWrite): GpuExec = {
-    GpuReplaceDataExec(childPlan, cpuExec.refreshCache, cpuExec.projections, gpuWrite)
-  }
+import java.io.IOException;
+import java.io.Serializable;
+
+/**
+ * Serializable extension point for callers that want to replace Hadoop input
+ * files with an optimized implementation for selected paths.
+ */
+@FunctionalInterface
+public interface HadoopInputFileFactory extends Serializable {
+    RapidsInputFile create(Path path, Configuration conf) throws IOException;
 }
diff --git a/sql-plugin/src/main/java/com/nvidia/spark/rapids/fileio/hadoop/HadoopInputStream.java b/sql-plugin-fileio/src/main/java/com/nvidia/spark/rapids/fileio/hadoop/HadoopInputStream.java
similarity index 97%
rename from sql-plugin/src/main/java/com/nvidia/spark/rapids/fileio/hadoop/HadoopInputStream.java
rename to sql-plugin-fileio/src/main/java/com/nvidia/spark/rapids/fileio/hadoop/HadoopInputStream.java
index 289e6dc0355..18b3c464da8 100644
--- a/sql-plugin/src/main/java/com/nvidia/spark/rapids/fileio/hadoop/HadoopInputStream.java
+++ b/sql-plugin-fileio/src/main/java/com/nvidia/spark/rapids/fileio/hadoop/HadoopInputStream.java
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2025, NVIDIA CORPORATION.
+ * Copyright (c) 2025-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
diff --git a/sql-plugin/src/main/java/com/nvidia/spark/rapids/fileio/hadoop/HadoopOutputFile.java b/sql-plugin-fileio/src/main/java/com/nvidia/spark/rapids/fileio/hadoop/HadoopOutputFile.java
similarity index 97%
rename from sql-plugin/src/main/java/com/nvidia/spark/rapids/fileio/hadoop/HadoopOutputFile.java
rename to sql-plugin-fileio/src/main/java/com/nvidia/spark/rapids/fileio/hadoop/HadoopOutputFile.java
index 3ed1146eefa..f24f77d0fe5 100644
--- a/sql-plugin/src/main/java/com/nvidia/spark/rapids/fileio/hadoop/HadoopOutputFile.java
+++ b/sql-plugin-fileio/src/main/java/com/nvidia/spark/rapids/fileio/hadoop/HadoopOutputFile.java
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2025, NVIDIA CORPORATION.
+ * Copyright (c) 2025-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
diff --git a/sql-plugin/src/main/java/com/nvidia/spark/rapids/fileio/hadoop/HadoopOutputStream.java b/sql-plugin-fileio/src/main/java/com/nvidia/spark/rapids/fileio/hadoop/HadoopOutputStream.java
similarity index 97%
rename from sql-plugin/src/main/java/com/nvidia/spark/rapids/fileio/hadoop/HadoopOutputStream.java
rename to sql-plugin-fileio/src/main/java/com/nvidia/spark/rapids/fileio/hadoop/HadoopOutputStream.java
index 301570fba1f..9b628bc826f 100644
--- a/sql-plugin/src/main/java/com/nvidia/spark/rapids/fileio/hadoop/HadoopOutputStream.java
+++ b/sql-plugin-fileio/src/main/java/com/nvidia/spark/rapids/fileio/hadoop/HadoopOutputStream.java
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2025, NVIDIA CORPORATION.
+ * Copyright (c) 2025-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
diff --git a/sql-plugin-fileio/src/main/java/com/nvidia/spark/rapids/fileio/hadoop/PerfIOHadoopInputFileFactory.java b/sql-plugin-fileio/src/main/java/com/nvidia/spark/rapids/fileio/hadoop/PerfIOHadoopInputFileFactory.java
new file mode 100644
index 00000000000..2fcd6d896af
--- /dev/null
+++ b/sql-plugin-fileio/src/main/java/com/nvidia/spark/rapids/fileio/hadoop/PerfIOHadoopInputFileFactory.java
@@ -0,0 +1,44 @@
+/*
+ * Copyright (c) 2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.nvidia.spark.rapids.fileio.hadoop;
+
+import com.nvidia.spark.rapids.fileio.RapidsInputFiles;
+import com.nvidia.spark.rapids.jni.fileio.RapidsInputFile;
+import org.apache.hadoop.conf.Configuration;
+import org.apache.hadoop.fs.Path;
+
+import java.io.IOException;
+
+/** Input factory that sends S3 paths through PerfIO whenever the registered bridge enables it. */
+public final class PerfIOHadoopInputFileFactory implements HadoopInputFileFactory {
+    public static final PerfIOHadoopInputFileFactory INSTANCE = new PerfIOHadoopInputFileFactory();
+
+    private PerfIOHadoopInputFileFactory() {}
+
+    @Override
+    public RapidsInputFile create(Path path, Configuration conf) throws IOException {
+        final String uriScheme = path.toUri().getScheme();
+        final boolean s3Path = uriScheme != null && uriScheme.startsWith("s3");
+        // Scheme is tested first, so the PerfIO bridge is only consulted for s3* paths.
+        return s3Path && RapidsInputFiles.isS3PerfEnabled()
+                ? S3InputFile.create(path, conf)
+                : HadoopInputFile.create(path, conf);
+    }
+
+    /** Makes deserialization hand back the shared {@link #INSTANCE}. */
+    private Object readResolve() { return INSTANCE; }
+}
diff --git a/sql-plugin-fileio/src/main/java/com/nvidia/spark/rapids/fileio/hadoop/S3InputFile.java b/sql-plugin-fileio/src/main/java/com/nvidia/spark/rapids/fileio/hadoop/S3InputFile.java
new file mode 100644
index 00000000000..d9932bfda4e
--- /dev/null
+++ b/sql-plugin-fileio/src/main/java/com/nvidia/spark/rapids/fileio/hadoop/S3InputFile.java
@@ -0,0 +1,97 @@
+/*
+ * Copyright (c) 2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.nvidia.spark.rapids.fileio.hadoop;
+
+import ai.rapids.cudf.HostMemoryBuffer;
+import com.nvidia.spark.rapids.fileio.RapidsInputFiles;
+import com.nvidia.spark.rapids.jni.fileio.RapidsInputFile;
+import com.nvidia.spark.rapids.jni.fileio.SeekableInputStream;
+import org.apache.hadoop.conf.Configuration;
+import org.apache.hadoop.fs.Path;
+
+import java.io.IOException;
+import java.net.URI;
+import java.util.List;
+import java.util.OptionalLong;
+
+/**
+ * S3-backed {@link RapidsInputFile} for Hadoop-conf-driven (non-iceberg) reads. The
+ * {@code readVectored} and {@code readTail} calls go through {@link RapidsInputFiles};
+ * every other operation is forwarded to the wrapped {@link HadoopInputFile}.
+ */
+public class S3InputFile implements RapidsInputFile {
+    private final HadoopInputFile delegate;
+    private final URI fileUri;
+    private final Configuration hadoopConf;
+
+    private S3InputFile(HadoopInputFile delegate, URI fileUri, Configuration hadoopConf) {
+        this.delegate = delegate;
+        this.fileUri = fileUri;
+        this.hadoopConf = hadoopConf;
+    }
+
+    public static S3InputFile create(Path filePath, Configuration conf) throws IOException {
+        return new S3InputFile(HadoopInputFile.create(filePath, conf), filePath.toUri(), conf);
+    }
+
+    @Override
+    public String path() {
+        return delegate.path();
+    }
+
+    @Override
+    public long getLength() throws IOException {
+        return delegate.getLength();
+    }
+
+    @Override
+    public OptionalLong getLastModificationTime() throws IOException {
+        return delegate.getLastModificationTime();
+    }
+
+    @Override
+    public SeekableInputStream open() throws IOException {
+        return delegate.open();
+    }
+
+    @Override
+    public void readVectored(HostMemoryBuffer output, List<RapidsInputFile.CopyRange> copyRanges)
+            throws IOException {
+        requirePerfIO(RapidsInputFiles.readS3Vectored(hadoopConf, fileUri, output, copyRanges));
+    }
+
+    /**
+     * Reads the last {@code length} bytes into {@code output} with one suffix-range
+     * {@code GetObject} ({@code Range: bytes=-N}), skipping the {@code getLength()} lookup.
+     */
+    @Override
+    public void readTail(long length, HostMemoryBuffer output) throws IOException {
+        if (length < 0) {
+            throw new IllegalArgumentException("length must be non-negative");
+        }
+        if (length > 0) {
+            requirePerfIO(RapidsInputFiles.readS3Tail(hadoopConf, fileUri, output, length, 0L));
+        }
+    }
+
+    /** Throws when the bridge in {@link RapidsInputFiles} answered false for a read. */
+    private static void requirePerfIO(boolean handled) {
+        if (!handled) {
+            throw new IllegalArgumentException("expected to use PerfIO to read");
+        }
+    }
+}
diff --git a/sql-plugin-format/pom.xml b/sql-plugin-format/pom.xml
new file mode 100644
index 00000000000..8535478f125
--- /dev/null
+++ b/sql-plugin-format/pom.xml
@@ -0,0 +1,111 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!--
+  Copyright (c) 2026, NVIDIA CORPORATION.
+
+  Licensed under the Apache License, Version 2.0 (the "License");
+  you may not use this file except in compliance with the License.
+  You may obtain a copy of the License at
+
+     http://www.apache.org/licenses/LICENSE-2.0
+
+  Unless required by applicable law or agreed to in writing, software
+  distributed under the License is distributed on an "AS IS" BASIS,
+  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+  See the License for the specific language governing permissions and
+  limitations under the License.
+-->
+<project xmlns="http://maven.apache.org/POM/4.0.0"
+         xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
+         xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/xsd/maven-4.0.0.xsd">
+    <modelVersion>4.0.0</modelVersion>
+
+    <parent>
+        <groupId>com.nvidia</groupId>
+        <artifactId>rapids-4-spark-shim-deps-parent_2.12</artifactId>
+        <version>26.08.0-SNAPSHOT</version>
+        <relativePath>../shim-deps/pom.xml</relativePath>
+    </parent>
+
+    <artifactId>rapids-4-spark-sql-plugin-format_2.12</artifactId>
+    <description>Java-only FlatBuffers format classes for the RAPIDS SQL plugin</description>
+    <version>26.08.0-SNAPSHOT</version>
+
+    <properties>
+        <rapids.module>sql-plugin-format</rapids.module>
+        <rapids.compressed.artifact>false</rapids.compressed.artifact>
+        <rapids.default.jar.excludePattern>**/*</rapids.default.jar.excludePattern>
+        <rapids.shim.jar.phase>package</rapids.shim.jar.phase>
+        <rapids.shimplify.skip>true</rapids.shimplify.skip>
+    </properties>
+
+    <dependencies>
+        <dependency>
+            <groupId>com.google.flatbuffers</groupId>
+            <artifactId>flatbuffers-java</artifactId>
+        </dependency>
+    </dependencies>
+
+    <build>
+        <plugins>
+            <plugin>
+                <groupId>org.apache.maven.plugins</groupId>
+                <artifactId>maven-compiler-plugin</artifactId>
+                <executions>
+                    <execution>
+                        <id>default-compile</id>
+                        <phase>compile</phase>
+                        <goals>
+                            <goal>compile</goal>
+                        </goals>
+                    </execution>
+                    <execution>
+                        <id>default-testCompile</id>
+                        <phase>test-compile</phase>
+                        <goals>
+                            <goal>testCompile</goal>
+                        </goals>
+                    </execution>
+                </executions>
+                <configuration>
+                    <release>${java.major.version}</release>
+                    <compilerArgs>
+                        <arg>-Xlint:all,-serial,-path,-try,-processing</arg>
+                    </compilerArgs>
+                </configuration>
+            </plugin>
+            <plugin>
+                <groupId>net.alchim31.maven</groupId>
+                <artifactId>scala-maven-plugin</artifactId>
+                <executions>
+                    <execution>
+                        <id>eclipse-add-source</id>
+                        <phase>none</phase>
+                    </execution>
+                    <execution>
+                        <id>scala-compile-first</id>
+                        <phase>none</phase>
+                    </execution>
+                    <execution>
+                        <id>scala-test-compile-first</id>
+                        <phase>none</phase>
+                    </execution>
+                    <execution>
+                        <id>attach-scaladocs</id>
+                        <phase>none</phase>
+                    </execution>
+                </executions>
+            </plugin>
+            <plugin>
+                <groupId>org.apache.rat</groupId>
+                <artifactId>apache-rat-plugin</artifactId>
+            </plugin>
+            <plugin>
+                <groupId>org.apache.maven.plugins</groupId>
+                <artifactId>maven-surefire-plugin</artifactId>
+                <configuration>
+                    <skipTests>true</skipTests>
+                </configuration>
+            </plugin>
+        </plugins>
+    </build>
+</project>
diff --git a/sql-plugin/src/main/java/com/nvidia/spark/rapids/format/BlockIdMeta.java b/sql-plugin-format/src/main/java/com/nvidia/spark/rapids/format/BlockIdMeta.java
similarity index 83%
rename from sql-plugin/src/main/java/com/nvidia/spark/rapids/format/BlockIdMeta.java
rename to sql-plugin-format/src/main/java/com/nvidia/spark/rapids/format/BlockIdMeta.java
index ed28904a876..b43473f0b14 100644
--- a/sql-plugin/src/main/java/com/nvidia/spark/rapids/format/BlockIdMeta.java
+++ b/sql-plugin-format/src/main/java/com/nvidia/spark/rapids/format/BlockIdMeta.java
@@ -1,3 +1,19 @@
+/*
+ * Copyright (c) 2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
 // automatically generated by the FlatBuffers compiler, do not modify
 
 package com.nvidia.spark.rapids.format;
@@ -49,4 +65,3 @@ public static int endBlockIdMeta(FlatBufferBuilder builder) {
     return o;
   }
 }
-
diff --git a/sql-plugin/src/main/java/com/nvidia/spark/rapids/format/BufferMeta.java b/sql-plugin-format/src/main/java/com/nvidia/spark/rapids/format/BufferMeta.java
similarity index 85%
rename from sql-plugin/src/main/java/com/nvidia/spark/rapids/format/BufferMeta.java
rename to sql-plugin-format/src/main/java/com/nvidia/spark/rapids/format/BufferMeta.java
index ea8ea94ce93..0e040e9da42 100644
--- a/sql-plugin/src/main/java/com/nvidia/spark/rapids/format/BufferMeta.java
+++ b/sql-plugin-format/src/main/java/com/nvidia/spark/rapids/format/BufferMeta.java
@@ -1,3 +1,19 @@
+/*
+ * Copyright (c) 2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
 // automatically generated by the FlatBuffers compiler, do not modify
 
 package com.nvidia.spark.rapids.format;
@@ -61,4 +77,3 @@ public static int endBufferMeta(FlatBufferBuilder builder) {
     return o;
   }
 }
-
diff --git a/sql-plugin/src/main/java/com/nvidia/spark/rapids/format/BufferTransferRequest.java b/sql-plugin-format/src/main/java/com/nvidia/spark/rapids/format/BufferTransferRequest.java
similarity index 74%
rename from sql-plugin/src/main/java/com/nvidia/spark/rapids/format/BufferTransferRequest.java
rename to sql-plugin-format/src/main/java/com/nvidia/spark/rapids/format/BufferTransferRequest.java
index 38d8e0995dd..71f4dfff4ce 100644
--- a/sql-plugin/src/main/java/com/nvidia/spark/rapids/format/BufferTransferRequest.java
+++ b/sql-plugin-format/src/main/java/com/nvidia/spark/rapids/format/BufferTransferRequest.java
@@ -1,3 +1,19 @@
+/*
+ * Copyright (c) 2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
 // automatically generated by the FlatBuffers compiler, do not modify
 
 package com.nvidia.spark.rapids.format;
@@ -34,4 +50,3 @@ public static int endBufferTransferRequest(FlatBufferBuilder builder) {
     return o;
   }
 }
-
diff --git a/sql-plugin/src/main/java/com/nvidia/spark/rapids/format/BufferTransferResponse.java b/sql-plugin-format/src/main/java/com/nvidia/spark/rapids/format/BufferTransferResponse.java
similarity index 82%
rename from sql-plugin/src/main/java/com/nvidia/spark/rapids/format/BufferTransferResponse.java
rename to sql-plugin-format/src/main/java/com/nvidia/spark/rapids/format/BufferTransferResponse.java
index a3cbda453d4..8a074fcc127 100644
--- a/sql-plugin/src/main/java/com/nvidia/spark/rapids/format/BufferTransferResponse.java
+++ b/sql-plugin-format/src/main/java/com/nvidia/spark/rapids/format/BufferTransferResponse.java
@@ -1,3 +1,19 @@
+/*
+ * Copyright (c) 2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
 // automatically generated by the FlatBuffers compiler, do not modify
 
 package com.nvidia.spark.rapids.format;
@@ -50,4 +66,3 @@ public static int endBufferTransferResponse(FlatBufferBuilder builder) {
     return o;
   }
 }
-
diff --git a/sql-plugin/src/main/java/com/nvidia/spark/rapids/format/CodecBufferDescriptor.java b/sql-plugin-format/src/main/java/com/nvidia/spark/rapids/format/CodecBufferDescriptor.java
similarity index 87%
rename from sql-plugin/src/main/java/com/nvidia/spark/rapids/format/CodecBufferDescriptor.java
rename to sql-plugin-format/src/main/java/com/nvidia/spark/rapids/format/CodecBufferDescriptor.java
index 681cc7ab31d..3bb1a2bd4ad 100644
--- a/sql-plugin/src/main/java/com/nvidia/spark/rapids/format/CodecBufferDescriptor.java
+++ b/sql-plugin-format/src/main/java/com/nvidia/spark/rapids/format/CodecBufferDescriptor.java
@@ -1,3 +1,19 @@
+/*
+ * Copyright (c) 2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
 // automatically generated by the FlatBuffers compiler, do not modify
 
 package com.nvidia.spark.rapids.format;
@@ -71,4 +87,3 @@ public static int endCodecBufferDescriptor(FlatBufferBuilder builder) {
     return o;
   }
 }
-
diff --git a/sql-plugin/src/main/java/com/nvidia/spark/rapids/format/CodecType.java b/sql-plugin-format/src/main/java/com/nvidia/spark/rapids/format/CodecType.java
similarity index 55%
rename from sql-plugin/src/main/java/com/nvidia/spark/rapids/format/CodecType.java
rename to sql-plugin-format/src/main/java/com/nvidia/spark/rapids/format/CodecType.java
index 1451e1221a4..762773e618d 100644
--- a/sql-plugin/src/main/java/com/nvidia/spark/rapids/format/CodecType.java
+++ b/sql-plugin-format/src/main/java/com/nvidia/spark/rapids/format/CodecType.java
@@ -1,3 +1,19 @@
+/*
+ * Copyright (c) 2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
 // automatically generated by the FlatBuffers compiler, do not modify
 
 package com.nvidia.spark.rapids.format;
@@ -25,4 +41,3 @@ private CodecType() { }
 
   public static String name(int e) { return names[e - COPY]; }
 }
-
diff --git a/sql-plugin/src/main/java/com/nvidia/spark/rapids/format/MetadataRequest.java b/sql-plugin-format/src/main/java/com/nvidia/spark/rapids/format/MetadataRequest.java
similarity index 80%
rename from sql-plugin/src/main/java/com/nvidia/spark/rapids/format/MetadataRequest.java
rename to sql-plugin-format/src/main/java/com/nvidia/spark/rapids/format/MetadataRequest.java
index 301d1a9a682..84f2b9f4cd1 100644
--- a/sql-plugin/src/main/java/com/nvidia/spark/rapids/format/MetadataRequest.java
+++ b/sql-plugin-format/src/main/java/com/nvidia/spark/rapids/format/MetadataRequest.java
@@ -1,3 +1,19 @@
+/*
+ * Copyright (c) 2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
 // automatically generated by the FlatBuffers compiler, do not modify
 
 package com.nvidia.spark.rapids.format;
@@ -42,4 +58,3 @@ public static int endMetadataRequest(FlatBufferBuilder builder) {
   public static void finishMetadataRequestBuffer(FlatBufferBuilder builder, int offset) { builder.finish(offset); }
   public static void finishSizePrefixedMetadataRequestBuffer(FlatBufferBuilder builder, int offset) { builder.finishSizePrefixed(offset); }
 }
-
diff --git a/sql-plugin/src/main/java/com/nvidia/spark/rapids/format/MetadataResponse.java b/sql-plugin-format/src/main/java/com/nvidia/spark/rapids/format/MetadataResponse.java
similarity index 80%
rename from sql-plugin/src/main/java/com/nvidia/spark/rapids/format/MetadataResponse.java
rename to sql-plugin-format/src/main/java/com/nvidia/spark/rapids/format/MetadataResponse.java
index 63d2cdd311b..bb9fdd0a0a3 100644
--- a/sql-plugin/src/main/java/com/nvidia/spark/rapids/format/MetadataResponse.java
+++ b/sql-plugin-format/src/main/java/com/nvidia/spark/rapids/format/MetadataResponse.java
@@ -1,3 +1,19 @@
+/*
+ * Copyright (c) 2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
 // automatically generated by the FlatBuffers compiler, do not modify
 
 package com.nvidia.spark.rapids.format;
@@ -42,4 +58,3 @@ public static int endMetadataResponse(FlatBufferBuilder builder) {
   public static void finishMetadataResponseBuffer(FlatBufferBuilder builder, int offset) { builder.finish(offset); }
   public static void finishSizePrefixedMetadataResponseBuffer(FlatBufferBuilder builder, int offset) { builder.finishSizePrefixed(offset); }
 }
-
diff --git a/sql-plugin/src/main/java/com/nvidia/spark/rapids/format/TableMeta.java b/sql-plugin-format/src/main/java/com/nvidia/spark/rapids/format/TableMeta.java
similarity index 84%
rename from sql-plugin/src/main/java/com/nvidia/spark/rapids/format/TableMeta.java
rename to sql-plugin-format/src/main/java/com/nvidia/spark/rapids/format/TableMeta.java
index 03b37241215..f8ce12ec918 100644
--- a/sql-plugin/src/main/java/com/nvidia/spark/rapids/format/TableMeta.java
+++ b/sql-plugin-format/src/main/java/com/nvidia/spark/rapids/format/TableMeta.java
@@ -1,3 +1,19 @@
+/*
+ * Copyright (c) 2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
 // automatically generated by the FlatBuffers compiler, do not modify
 
 package com.nvidia.spark.rapids.format;
@@ -58,4 +74,3 @@ public static int endTableMeta(FlatBufferBuilder builder) {
     return o;
   }
 }
-
diff --git a/sql-plugin/src/main/java/com/nvidia/spark/rapids/format/TransferRequest.java b/sql-plugin-format/src/main/java/com/nvidia/spark/rapids/format/TransferRequest.java
similarity index 83%
rename from sql-plugin/src/main/java/com/nvidia/spark/rapids/format/TransferRequest.java
rename to sql-plugin-format/src/main/java/com/nvidia/spark/rapids/format/TransferRequest.java
index 4cb5a2f2547..58f8f838906 100644
--- a/sql-plugin/src/main/java/com/nvidia/spark/rapids/format/TransferRequest.java
+++ b/sql-plugin-format/src/main/java/com/nvidia/spark/rapids/format/TransferRequest.java
@@ -1,3 +1,19 @@
+/*
+ * Copyright (c) 2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
 // automatically generated by the FlatBuffers compiler, do not modify
 
 package com.nvidia.spark.rapids.format;
@@ -50,4 +66,3 @@ public static int endTransferRequest(FlatBufferBuilder builder) {
   public static void finishTransferRequestBuffer(FlatBufferBuilder builder, int offset) { builder.finish(offset); }
   public static void finishSizePrefixedTransferRequestBuffer(FlatBufferBuilder builder, int offset) { builder.finishSizePrefixed(offset); }
 }
-
diff --git a/sql-plugin/src/main/java/com/nvidia/spark/rapids/format/TransferResponse.java b/sql-plugin-format/src/main/java/com/nvidia/spark/rapids/format/TransferResponse.java
similarity index 81%
rename from sql-plugin/src/main/java/com/nvidia/spark/rapids/format/TransferResponse.java
rename to sql-plugin-format/src/main/java/com/nvidia/spark/rapids/format/TransferResponse.java
index b1a03c05ba3..208cceb04ff 100644
--- a/sql-plugin/src/main/java/com/nvidia/spark/rapids/format/TransferResponse.java
+++ b/sql-plugin-format/src/main/java/com/nvidia/spark/rapids/format/TransferResponse.java
@@ -1,3 +1,19 @@
+/*
+ * Copyright (c) 2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
 // automatically generated by the FlatBuffers compiler, do not modify
 
 package com.nvidia.spark.rapids.format;
@@ -42,4 +58,3 @@ public static int endTransferResponse(FlatBufferBuilder builder) {
   public static void finishTransferResponseBuffer(FlatBufferBuilder builder, int offset) { builder.finish(offset); }
   public static void finishSizePrefixedTransferResponseBuffer(FlatBufferBuilder builder, int offset) { builder.finishSizePrefixed(offset); }
 }
-
diff --git a/sql-plugin-format/src/main/java/com/nvidia/spark/rapids/format/TransferState.java b/sql-plugin-format/src/main/java/com/nvidia/spark/rapids/format/TransferState.java
new file mode 100644
index 00000000000..41dad2caa6e
--- /dev/null
+++ b/sql-plugin-format/src/main/java/com/nvidia/spark/rapids/format/TransferState.java
@@ -0,0 +1,35 @@
+/*
+ * Copyright (c) 2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+// automatically generated by the FlatBuffers compiler, do not modify
+
+package com.nvidia.spark.rapids.format;
+
+public final class TransferState {
+  private TransferState() { } // private constructor: this class only holds constants
+  /**
+   * UCX transfer initiated on sender-side
+   */
+  public static final byte STARTED = 0;
+  /**
+   * Data has been compressed and requires meta update
+   */
+  public static final byte BUFFER_META_UPDATED = 1;
+
+  public static final String[] names = { "STARTED", "BUFFER_META_UPDATED", }; // index == value
+
+  public static String name(int e) { return names[e]; } // no range check on e
+}
diff --git a/sql-plugin-shims/pom.xml b/sql-plugin-shims/pom.xml
new file mode 100644
index 00000000000..b1f200b2356
--- /dev/null
+++ b/sql-plugin-shims/pom.xml
@@ -0,0 +1,68 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!--
+  Copyright (c) 2026, NVIDIA CORPORATION.
+
+  Licensed under the Apache License, Version 2.0 (the "License");
+  you may not use this file except in compliance with the License.
+  You may obtain a copy of the License at
+
+     http://www.apache.org/licenses/LICENSE-2.0
+
+  Unless required by applicable law or agreed to in writing, software
+  distributed under the License is distributed on an "AS IS" BASIS,
+  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+  See the License for the specific language governing permissions and
+  limitations under the License.
+-->
+<project xmlns="http://maven.apache.org/POM/4.0.0"
+         xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
+         xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/xsd/maven-4.0.0.xsd">
+    <modelVersion>4.0.0</modelVersion>
+
+    <parent> <!-- parent is resolved from ../shim-deps/pom.xml, not from the directory above -->
+        <groupId>com.nvidia</groupId>
+        <artifactId>rapids-4-spark-shim-deps-parent_2.12</artifactId>
+        <version>26.08.0-SNAPSHOT</version>
+        <relativePath>../shim-deps/pom.xml</relativePath>
+    </parent>
+    <artifactId>rapids-4-spark-sql-shims_2.12</artifactId>
+    <name>RAPIDS Accelerator for Apache Spark SQL Plugin Shims</name>
+    <description>Compile-time isolated SQL plugin shims</description>
+    <version>26.08.0-SNAPSHOT</version>
+
+    <properties> <!-- NOTE(review): presumably consumed by the parent POM's build config; confirm -->
+        <rapids.module>sql-plugin-shims</rapids.module>
+        <rapids.compressed.artifact>false</rapids.compressed.artifact>
+        <rapids.default.jar.excludePattern>**/*</rapids.default.jar.excludePattern> <!-- glob matches every path -->
+        <rapids.shim.jar.phase>package</rapids.shim.jar.phase>
+    </properties>
+
+    <dependencies>
+        <dependency> <!-- plugin API artifact at this module's own version, per-Spark classifier -->
+            <groupId>com.nvidia</groupId>
+            <artifactId>rapids-4-spark-sql-plugin-api_${scala.binary.version}</artifactId>
+            <version>${project.version}</version>
+            <classifier>${spark.version.classifier}</classifier>
+        </dependency>
+        <dependency> <!-- no version declared here; it must come from inherited dependencyManagement -->
+            <groupId>org.scala-lang</groupId>
+            <artifactId>scala-library</artifactId>
+        </dependency>
+    </dependencies>
+
+    <build>
+        <plugins> <!-- plugins are listed without version/configuration; presumably inherited from the parent -->
+            <plugin>
+                <groupId>net.alchim31.maven</groupId>
+                <artifactId>scala-maven-plugin</artifactId>
+            </plugin>
+            <plugin>
+                <artifactId>maven-antrun-plugin</artifactId>
+            </plugin>
+            <plugin>
+                <groupId>org.apache.rat</groupId>
+                <artifactId>apache-rat-plugin</artifactId>
+            </plugin>
+        </plugins>
+    </build>
+</project>
diff --git a/sql-plugin-shims/src/main/scala/org/apache/spark/sql/errors/ConvUtils.scala b/sql-plugin-shims/src/main/scala/org/apache/spark/sql/errors/ConvUtils.scala
new file mode 100644
index 00000000000..abd23b7f158
--- /dev/null
+++ b/sql-plugin-shims/src/main/scala/org/apache/spark/sql/errors/ConvUtils.scala
@@ -0,0 +1,40 @@
+/*
+ * Copyright (c) 2025-2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+package org.apache.spark.sql.errors
+
+import java.lang.reflect.InvocationTargetException
+
+/** Raises Spark's `QueryExecutionErrors.overflowInConvError` via runtime reflection. */
+object ConvUtils {
+  private val queryExecutionErrorsCompanion = "org.apache.spark.sql.errors.QueryExecutionErrors$"
+  private val unavailable = "overflowInConvError is not available in this Spark version"
+
+  /** Never returns normally; throws UnsupportedOperationException if Spark lacks the method. */
+  def overflowInConvError(): Unit = {
+    try {
+      val companion = Class.forName(queryExecutionErrorsCompanion).getField("MODULE$").get(null)
+      val method = companion.getClass.getMethods
+        .find(m => m.getName == "overflowInConvError" && m.getParameterCount == 1)
+        .getOrElse(throw new UnsupportedOperationException(unavailable))
+      throw method.invoke(companion, null.asInstanceOf[AnyRef]).asInstanceOf[Throwable]
+    } catch {
+      case e @ (_: ClassNotFoundException | _: NoSuchFieldException) =>
+        throw new UnsupportedOperationException(unavailable, e)
+      // Rethrow the underlying failure; keep the wrapper when no cause was recorded.
+      case e: InvocationTargetException => throw Option(e.getCause).getOrElse(e)
+    }
+  }
+}
diff --git a/sql-plugin/src/main/spark400/scala/org/apache/spark/sql/rapids/shims/SparkSessionUtils.scala b/sql-plugin-shims/src/main/scala/org/apache/spark/sql/rapids/shims/SparkSessionUtils.scala
similarity index 65%
rename from sql-plugin/src/main/spark400/scala/org/apache/spark/sql/rapids/shims/SparkSessionUtils.scala
rename to sql-plugin-shims/src/main/scala/org/apache/spark/sql/rapids/shims/SparkSessionUtils.scala
index 6de8f1d6165..a68f2d6bafd 100644
--- a/sql-plugin/src/main/spark400/scala/org/apache/spark/sql/rapids/shims/SparkSessionUtils.scala
+++ b/sql-plugin-shims/src/main/scala/org/apache/spark/sql/rapids/shims/SparkSessionUtils.scala
@@ -14,24 +14,29 @@
  * limitations under the License.
  */
 
-/*** spark-rapids-shim-json-lines
-{"spark": "400"}
-{"spark": "400db173"}
-{"spark": "401"}
-{"spark": "402"}
-{"spark": "411"}
-spark-rapids-shim-json-lines ***/
 package org.apache.spark.sql.rapids.shims
 
-import org.apache.spark.sql.classic.SparkSession
+import java.lang.reflect.InvocationTargetException
+
+import org.apache.spark.sql.SparkSession
 import org.apache.spark.sql.execution.SparkPlan
 
 object SparkSessionUtils {
+  // Both accessors below resolve the member by name at runtime through invokeNoArg.
   def sessionFromPlan(plan: SparkPlan): SparkSession = {
-    plan.session
+    invokeNoArg(plan, "session").asInstanceOf[SparkSession]
   }
 
   def leafNodeDefaultParallelism(ss: SparkSession): Int = {
-    ss.leafNodeDefaultParallelism
+    invokeNoArg(ss, "leafNodeDefaultParallelism").asInstanceOf[Int]
+  }
+
+  private def invokeNoArg(target: AnyRef, methodName: String): AnyRef = {
+    try {
+      target.getClass.getMethod(methodName).invoke(target) // public zero-arg method lookup
+    } catch {
+      case e: InvocationTargetException => // surface the invoked method's own exception
+        throw e.getCause
+    }
   }
 }
diff --git a/sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/TryModeShim.scala b/sql-plugin-shims/src/main/spark330/scala/com/nvidia/spark/rapids/shims/CreateDataSourceTableAsSelectRules.scala
similarity index 62%
rename from sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/TryModeShim.scala
rename to sql-plugin-shims/src/main/spark330/scala/com/nvidia/spark/rapids/shims/CreateDataSourceTableAsSelectRules.scala
index 5e2a2eac009..6e7f9d737ed 100644
--- a/sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/TryModeShim.scala
+++ b/sql-plugin-shims/src/main/spark330/scala/com/nvidia/spark/rapids/shims/CreateDataSourceTableAsSelectRules.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2025-2026, NVIDIA CORPORATION.
+ * Copyright (c) 2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -16,6 +16,7 @@
 
 /*** spark-rapids-shim-json-lines
 {"spark": "330"}
+{"spark": "330db"}
 {"spark": "331"}
 {"spark": "332"}
 {"spark": "333"}
@@ -23,15 +24,12 @@
 spark-rapids-shim-json-lines ***/
 package com.nvidia.spark.rapids.shims
 
-import org.apache.spark.sql.catalyst.expressions.Expression
+import com.nvidia.spark.rapids.ShimDataWritingCommandRule
 
-object TryModeShim {
-  /**
-   * Expression is wrapped under TryEval during query planning which is not supported on GPU.
-   * Example: for try_add(col1, col2) it would be <TryEval> tryeval((col1#0 + col2#1))
-   * So the return value from this function does not matter.
-   */
-  def isTryMode(expr: Expression): Boolean = {
-    false
-  }
+import org.apache.spark.sql.execution.command.CreateDataSourceTableAsSelectCommand
+
+object CreateDataSourceTableAsSelectRules { // shim rule for CTAS data-writing commands
+  val dataWriteCmd: ShimDataWritingCommandRule[CreateDataSourceTableAsSelectCommand] =
+    ShimDataWritingCommandRule[CreateDataSourceTableAsSelectCommand](
+      "Create table with select command") // presumably the rule's description; confirm
 }
diff --git a/sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/SequenceSizeTooLongErrorBuilder.scala b/sql-plugin-shims/src/main/spark330/scala/com/nvidia/spark/rapids/shims/SequenceSizeTooLongErrorBuilder.scala
similarity index 100%
rename from sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/SequenceSizeTooLongErrorBuilder.scala
rename to sql-plugin-shims/src/main/spark330/scala/com/nvidia/spark/rapids/shims/SequenceSizeTooLongErrorBuilder.scala
diff --git a/sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/spark330/SparkShimServiceProvider.scala b/sql-plugin-shims/src/main/spark330/scala/com/nvidia/spark/rapids/shims/spark330/SparkShimServiceProvider.scala
similarity index 96%
rename from sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/spark330/SparkShimServiceProvider.scala
rename to sql-plugin-shims/src/main/spark330/scala/com/nvidia/spark/rapids/shims/spark330/SparkShimServiceProvider.scala
index e50335d71a8..4e209fe7450 100644
--- a/sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/spark330/SparkShimServiceProvider.scala
+++ b/sql-plugin-shims/src/main/spark330/scala/com/nvidia/spark/rapids/shims/spark330/SparkShimServiceProvider.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2021-2023, NVIDIA CORPORATION.
+ * Copyright (c) 2021-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
diff --git a/sql-plugin/src/main/spark330/scala/org/apache/spark/sql/rapids/ShuffleManagerShims.scala b/sql-plugin-shims/src/main/spark330/scala/org/apache/spark/sql/rapids/ShuffleManagerShims.scala
similarity index 100%
rename from sql-plugin/src/main/spark330/scala/org/apache/spark/sql/rapids/ShuffleManagerShims.scala
rename to sql-plugin-shims/src/main/spark330/scala/org/apache/spark/sql/rapids/ShuffleManagerShims.scala
diff --git a/sql-plugin/src/main/spark330/scala/org/apache/spark/sql/rapids/shims/FileCommitProtocolShims.scala b/sql-plugin-shims/src/main/spark330/scala/org/apache/spark/sql/rapids/shims/FileCommitProtocolShims.scala
similarity index 100%
rename from sql-plugin/src/main/spark330/scala/org/apache/spark/sql/rapids/shims/FileCommitProtocolShims.scala
rename to sql-plugin-shims/src/main/spark330/scala/org/apache/spark/sql/rapids/shims/FileCommitProtocolShims.scala
diff --git a/sql-plugin/src/main/spark330/scala/org/apache/spark/sql/rapids/shims/OriginContextShim.scala b/sql-plugin-shims/src/main/spark330/scala/org/apache/spark/sql/rapids/shims/OriginContextShim.scala
similarity index 100%
rename from sql-plugin/src/main/spark330/scala/org/apache/spark/sql/rapids/shims/OriginContextShim.scala
rename to sql-plugin-shims/src/main/spark330/scala/org/apache/spark/sql/rapids/shims/OriginContextShim.scala
diff --git a/sql-plugin/src/main/spark330/scala/org/apache/spark/sql/rapids/shims/SparkUpgradeExceptionShims.scala b/sql-plugin-shims/src/main/spark330/scala/org/apache/spark/sql/rapids/shims/SparkUpgradeExceptionShims.scala
similarity index 96%
rename from sql-plugin/src/main/spark330/scala/org/apache/spark/sql/rapids/shims/SparkUpgradeExceptionShims.scala
rename to sql-plugin-shims/src/main/spark330/scala/org/apache/spark/sql/rapids/shims/SparkUpgradeExceptionShims.scala
index 960384cd4e9..b0cab9169e4 100644
--- a/sql-plugin/src/main/spark330/scala/org/apache/spark/sql/rapids/shims/SparkUpgradeExceptionShims.scala
+++ b/sql-plugin-shims/src/main/spark330/scala/org/apache/spark/sql/rapids/shims/SparkUpgradeExceptionShims.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2022-2023, NVIDIA CORPORATION.
+ * Copyright (c) 2022-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
diff --git a/sql-plugin/src/main/spark330/scala/org/apache/spark/sql/rapids/shims/TrampolineConnectShims.scala b/sql-plugin-shims/src/main/spark330/scala/org/apache/spark/sql/rapids/shims/TrampolineConnectShims.scala
similarity index 100%
rename from sql-plugin/src/main/spark330/scala/org/apache/spark/sql/rapids/shims/TrampolineConnectShims.scala
rename to sql-plugin-shims/src/main/spark330/scala/org/apache/spark/sql/rapids/shims/TrampolineConnectShims.scala
diff --git a/sql-plugin/src/main/spark330/scala/org/apache/spark/storage/ShuffleClientShims.scala b/sql-plugin-shims/src/main/spark330/scala/org/apache/spark/storage/ShuffleClientShims.scala
similarity index 100%
rename from sql-plugin/src/main/spark330/scala/org/apache/spark/storage/ShuffleClientShims.scala
rename to sql-plugin-shims/src/main/spark330/scala/org/apache/spark/storage/ShuffleClientShims.scala
diff --git a/sql-plugin/src/main/spark330db/scala/com/nvidia/spark/rapids/DatabricksShimServiceProvider.scala b/sql-plugin-shims/src/main/spark330db/scala/com/nvidia/spark/rapids/DatabricksShimServiceProvider.scala
similarity index 100%
rename from sql-plugin/src/main/spark330db/scala/com/nvidia/spark/rapids/DatabricksShimServiceProvider.scala
rename to sql-plugin-shims/src/main/spark330db/scala/com/nvidia/spark/rapids/DatabricksShimServiceProvider.scala
diff --git a/sql-plugin/src/main/spark330db/scala/com/nvidia/spark/rapids/shims/spark330db/SparkShimServiceProvider.scala b/sql-plugin-shims/src/main/spark330db/scala/com/nvidia/spark/rapids/shims/spark330db/SparkShimServiceProvider.scala
similarity index 96%
rename from sql-plugin/src/main/spark330db/scala/com/nvidia/spark/rapids/shims/spark330db/SparkShimServiceProvider.scala
rename to sql-plugin-shims/src/main/spark330db/scala/com/nvidia/spark/rapids/shims/spark330db/SparkShimServiceProvider.scala
index 0db1385cda5..149c45b7dab 100644
--- a/sql-plugin/src/main/spark330db/scala/com/nvidia/spark/rapids/shims/spark330db/SparkShimServiceProvider.scala
+++ b/sql-plugin-shims/src/main/spark330db/scala/com/nvidia/spark/rapids/shims/spark330db/SparkShimServiceProvider.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2022-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2022-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
diff --git a/sql-plugin/src/main/spark330db/scala/org/apache/spark/sql/rapids/shims/OriginContextShim.scala b/sql-plugin-shims/src/main/spark330db/scala/org/apache/spark/sql/rapids/shims/OriginContextShim.scala
similarity index 100%
rename from sql-plugin/src/main/spark330db/scala/org/apache/spark/sql/rapids/shims/OriginContextShim.scala
rename to sql-plugin-shims/src/main/spark330db/scala/org/apache/spark/sql/rapids/shims/OriginContextShim.scala
diff --git a/sql-plugin/src/main/spark330db/scala/org/apache/spark/sql/rapids/shims/SparkDateTimeExceptionShims.scala b/sql-plugin-shims/src/main/spark330db/scala/org/apache/spark/sql/rapids/shims/SparkDateTimeExceptionShims.scala
similarity index 95%
rename from sql-plugin/src/main/spark330db/scala/org/apache/spark/sql/rapids/shims/SparkDateTimeExceptionShims.scala
rename to sql-plugin-shims/src/main/spark330db/scala/org/apache/spark/sql/rapids/shims/SparkDateTimeExceptionShims.scala
index 4f59c12c985..a33ac76fdc5 100644
--- a/sql-plugin/src/main/spark330db/scala/org/apache/spark/sql/rapids/shims/SparkDateTimeExceptionShims.scala
+++ b/sql-plugin-shims/src/main/spark330db/scala/org/apache/spark/sql/rapids/shims/SparkDateTimeExceptionShims.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2022-2023, NVIDIA CORPORATION.
+ * Copyright (c) 2022-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
diff --git a/sql-plugin/src/main/spark330db/scala/org/apache/spark/sql/rapids/shims/SparkUpgradeExceptionShims.scala b/sql-plugin-shims/src/main/spark330db/scala/org/apache/spark/sql/rapids/shims/SparkUpgradeExceptionShims.scala
similarity index 96%
rename from sql-plugin/src/main/spark330db/scala/org/apache/spark/sql/rapids/shims/SparkUpgradeExceptionShims.scala
rename to sql-plugin-shims/src/main/spark330db/scala/org/apache/spark/sql/rapids/shims/SparkUpgradeExceptionShims.scala
index 2ae55c73057..feedbd11cf9 100644
--- a/sql-plugin/src/main/spark330db/scala/org/apache/spark/sql/rapids/shims/SparkUpgradeExceptionShims.scala
+++ b/sql-plugin-shims/src/main/spark330db/scala/org/apache/spark/sql/rapids/shims/SparkUpgradeExceptionShims.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2022-2023, NVIDIA CORPORATION.
+ * Copyright (c) 2022-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
diff --git a/sql-plugin/src/main/spark331/scala/com/nvidia/spark/rapids/shims/spark331/SparkShimServiceProvider.scala b/sql-plugin-shims/src/main/spark331/scala/com/nvidia/spark/rapids/shims/spark331/SparkShimServiceProvider.scala
similarity index 96%
rename from sql-plugin/src/main/spark331/scala/com/nvidia/spark/rapids/shims/spark331/SparkShimServiceProvider.scala
rename to sql-plugin-shims/src/main/spark331/scala/com/nvidia/spark/rapids/shims/spark331/SparkShimServiceProvider.scala
index db631bdfb63..0483b4ffc1d 100644
--- a/sql-plugin/src/main/spark331/scala/com/nvidia/spark/rapids/shims/spark331/SparkShimServiceProvider.scala
+++ b/sql-plugin-shims/src/main/spark331/scala/com/nvidia/spark/rapids/shims/spark331/SparkShimServiceProvider.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2022-2023, NVIDIA CORPORATION.
+ * Copyright (c) 2022-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
diff --git a/sql-plugin/src/main/spark332/scala/com/nvidia/spark/rapids/shims/spark332/SparkShimServiceProvider.scala b/sql-plugin-shims/src/main/spark332/scala/com/nvidia/spark/rapids/shims/spark332/SparkShimServiceProvider.scala
similarity index 96%
rename from sql-plugin/src/main/spark332/scala/com/nvidia/spark/rapids/shims/spark332/SparkShimServiceProvider.scala
rename to sql-plugin-shims/src/main/spark332/scala/com/nvidia/spark/rapids/shims/spark332/SparkShimServiceProvider.scala
index 06be70cb21b..57403b1848a 100644
--- a/sql-plugin/src/main/spark332/scala/com/nvidia/spark/rapids/shims/spark332/SparkShimServiceProvider.scala
+++ b/sql-plugin-shims/src/main/spark332/scala/com/nvidia/spark/rapids/shims/spark332/SparkShimServiceProvider.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2022-2023, NVIDIA CORPORATION.
+ * Copyright (c) 2022-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
diff --git a/sql-plugin/src/main/spark340/scala/org/apache/spark/sql/errors/ConvUtils.scala b/sql-plugin-shims/src/main/spark332db/scala/com/nvidia/spark/rapids/shims/CreateDataSourceTableAsSelectRules.scala
similarity index 68%
rename from sql-plugin/src/main/spark340/scala/org/apache/spark/sql/errors/ConvUtils.scala
rename to sql-plugin-shims/src/main/spark332db/scala/com/nvidia/spark/rapids/shims/CreateDataSourceTableAsSelectRules.scala
index d9a669771a4..704c5188af0 100644
--- a/sql-plugin/src/main/spark340/scala/org/apache/spark/sql/errors/ConvUtils.scala
+++ b/sql-plugin-shims/src/main/spark332db/scala/com/nvidia/spark/rapids/shims/CreateDataSourceTableAsSelectRules.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2025-2026, NVIDIA CORPORATION.
+ * Copyright (c) 2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -15,6 +15,7 @@
  */
 
 /*** spark-rapids-shim-json-lines
+{"spark": "332db"}
 {"spark": "340"}
 {"spark": "341"}
 {"spark": "341db"}
@@ -37,8 +38,14 @@
 {"spark": "402"}
 {"spark": "411"}
 spark-rapids-shim-json-lines ***/
-package org.apache.spark.sql.errors
+package com.nvidia.spark.rapids.shims
 
-object ConvUtils {
-  def overflowInConvError(): Unit = throw QueryExecutionErrors.overflowInConvError(null)
+import com.nvidia.spark.rapids.ShimRunnableCommandRule
+
+import org.apache.spark.sql.execution.command.CreateDataSourceTableAsSelectCommand
+
+object CreateDataSourceTableAsSelectRules {
+  val runnableCmd: ShimRunnableCommandRule[CreateDataSourceTableAsSelectCommand] =
+    ShimRunnableCommandRule[CreateDataSourceTableAsSelectCommand](
+      "Write to a data source")
 }
diff --git a/sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/BloomFilterConstantsShims.scala b/sql-plugin-shims/src/main/spark332db/scala/com/nvidia/spark/rapids/shims/WriteFilesExecShims.scala
similarity index 81%
rename from sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/BloomFilterConstantsShims.scala
rename to sql-plugin-shims/src/main/spark332db/scala/com/nvidia/spark/rapids/shims/WriteFilesExecShims.scala
index 21cf24ddfc2..f320286ff58 100644
--- a/sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/BloomFilterConstantsShims.scala
+++ b/sql-plugin-shims/src/main/spark332db/scala/com/nvidia/spark/rapids/shims/WriteFilesExecShims.scala
@@ -15,13 +15,7 @@
  */
 
 /*** spark-rapids-shim-json-lines
-{"spark": "330"}
-{"spark": "330db"}
-{"spark": "331"}
-{"spark": "332"}
 {"spark": "332db"}
-{"spark": "333"}
-{"spark": "334"}
 {"spark": "340"}
 {"spark": "341"}
 {"spark": "341db"}
@@ -42,9 +36,14 @@
 {"spark": "400db173"}
 {"spark": "401"}
 {"spark": "402"}
+{"spark": "411"}
 spark-rapids-shim-json-lines ***/
 package com.nvidia.spark.rapids.shims
 
-object BloomFilterConstantsShims {
-  val BLOOM_FILTER_FORMAT_VERSION: Int = 1
+import com.nvidia.spark.rapids.ShimExecRule
+
+import org.apache.spark.sql.execution.datasources.WriteFilesExec
+
+object WriteFilesExecShims {
+  val exec: ShimExecRule[WriteFilesExec] = ShimExecRule[WriteFilesExec]("v1 write files")
 }
diff --git a/sql-plugin/src/main/spark332db/scala/com/nvidia/spark/rapids/shims/spark332db/SparkShimServiceProvider.scala b/sql-plugin-shims/src/main/spark332db/scala/com/nvidia/spark/rapids/shims/spark332db/SparkShimServiceProvider.scala
similarity index 96%
rename from sql-plugin/src/main/spark332db/scala/com/nvidia/spark/rapids/shims/spark332db/SparkShimServiceProvider.scala
rename to sql-plugin-shims/src/main/spark332db/scala/com/nvidia/spark/rapids/shims/spark332db/SparkShimServiceProvider.scala
index be448c2d4ba..4af95229ee3 100644
--- a/sql-plugin/src/main/spark332db/scala/com/nvidia/spark/rapids/shims/spark332db/SparkShimServiceProvider.scala
+++ b/sql-plugin-shims/src/main/spark332db/scala/com/nvidia/spark/rapids/shims/spark332db/SparkShimServiceProvider.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2023-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2023-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
diff --git a/sql-plugin/src/main/spark332db/scala/org/apache/spark/sql/rapids/shims/SparkDateTimeExceptionShims.scala b/sql-plugin-shims/src/main/spark332db/scala/org/apache/spark/sql/rapids/shims/SparkDateTimeExceptionShims.scala
similarity index 100%
rename from sql-plugin/src/main/spark332db/scala/org/apache/spark/sql/rapids/shims/SparkDateTimeExceptionShims.scala
rename to sql-plugin-shims/src/main/spark332db/scala/org/apache/spark/sql/rapids/shims/SparkDateTimeExceptionShims.scala
diff --git a/sql-plugin/src/main/spark332db/scala/org/apache/spark/sql/rapids/shims/SparkUpgradeExceptionShims.scala b/sql-plugin-shims/src/main/spark332db/scala/org/apache/spark/sql/rapids/shims/SparkUpgradeExceptionShims.scala
similarity index 100%
rename from sql-plugin/src/main/spark332db/scala/org/apache/spark/sql/rapids/shims/SparkUpgradeExceptionShims.scala
rename to sql-plugin-shims/src/main/spark332db/scala/org/apache/spark/sql/rapids/shims/SparkUpgradeExceptionShims.scala
diff --git a/sql-plugin/src/main/spark333/scala/com/nvidia/spark/rapids/shims/spark333/SparkShimServiceProvider.scala b/sql-plugin-shims/src/main/spark333/scala/com/nvidia/spark/rapids/shims/spark333/SparkShimServiceProvider.scala
similarity index 96%
rename from sql-plugin/src/main/spark333/scala/com/nvidia/spark/rapids/shims/spark333/SparkShimServiceProvider.scala
rename to sql-plugin-shims/src/main/spark333/scala/com/nvidia/spark/rapids/shims/spark333/SparkShimServiceProvider.scala
index f329546de6a..a1c902dcbb6 100644
--- a/sql-plugin/src/main/spark333/scala/com/nvidia/spark/rapids/shims/spark333/SparkShimServiceProvider.scala
+++ b/sql-plugin-shims/src/main/spark333/scala/com/nvidia/spark/rapids/shims/spark333/SparkShimServiceProvider.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2023, NVIDIA CORPORATION.
+ * Copyright (c) 2023-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
diff --git a/sql-plugin/src/main/spark334/scala/com/nvidia/spark/rapids/shims/spark334/SparkShimServiceProvider.scala b/sql-plugin-shims/src/main/spark334/scala/com/nvidia/spark/rapids/shims/spark334/SparkShimServiceProvider.scala
similarity index 96%
rename from sql-plugin/src/main/spark334/scala/com/nvidia/spark/rapids/shims/spark334/SparkShimServiceProvider.scala
rename to sql-plugin-shims/src/main/spark334/scala/com/nvidia/spark/rapids/shims/spark334/SparkShimServiceProvider.scala
index 9742399c693..f917857bd36 100644
--- a/sql-plugin/src/main/spark334/scala/com/nvidia/spark/rapids/shims/spark334/SparkShimServiceProvider.scala
+++ b/sql-plugin-shims/src/main/spark334/scala/com/nvidia/spark/rapids/shims/spark334/SparkShimServiceProvider.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2023, NVIDIA CORPORATION.
+ * Copyright (c) 2023-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
diff --git a/sql-plugin/src/main/spark334/scala/org/apache/spark/sql/rapids/shims/SequenceSizeTooLongUnsuccessfulErrorBuilder.scala b/sql-plugin-shims/src/main/spark334/scala/org/apache/spark/sql/rapids/shims/SequenceSizeTooLongUnsuccessfulErrorBuilder.scala
similarity index 96%
rename from sql-plugin/src/main/spark334/scala/org/apache/spark/sql/rapids/shims/SequenceSizeTooLongUnsuccessfulErrorBuilder.scala
rename to sql-plugin-shims/src/main/spark334/scala/org/apache/spark/sql/rapids/shims/SequenceSizeTooLongUnsuccessfulErrorBuilder.scala
index b7b01b388b9..c2530d5d1c8 100644
--- a/sql-plugin/src/main/spark334/scala/org/apache/spark/sql/rapids/shims/SequenceSizeTooLongUnsuccessfulErrorBuilder.scala
+++ b/sql-plugin-shims/src/main/spark334/scala/org/apache/spark/sql/rapids/shims/SequenceSizeTooLongUnsuccessfulErrorBuilder.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2024-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2024-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
diff --git a/sql-plugin/src/main/spark340/scala/com/nvidia/spark/rapids/shims/spark340/SparkShimServiceProvider.scala b/sql-plugin-shims/src/main/spark340/scala/com/nvidia/spark/rapids/shims/spark340/SparkShimServiceProvider.scala
similarity index 96%
rename from sql-plugin/src/main/spark340/scala/com/nvidia/spark/rapids/shims/spark340/SparkShimServiceProvider.scala
rename to sql-plugin-shims/src/main/spark340/scala/com/nvidia/spark/rapids/shims/spark340/SparkShimServiceProvider.scala
index 23581ba9a28..38694beb937 100644
--- a/sql-plugin/src/main/spark340/scala/com/nvidia/spark/rapids/shims/spark340/SparkShimServiceProvider.scala
+++ b/sql-plugin-shims/src/main/spark340/scala/com/nvidia/spark/rapids/shims/spark340/SparkShimServiceProvider.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2022-2023, NVIDIA CORPORATION.
+ * Copyright (c) 2022-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
diff --git a/sql-plugin/src/main/spark340/scala/org/apache/spark/sql/rapids/shims/OriginContextShim.scala b/sql-plugin-shims/src/main/spark340/scala/org/apache/spark/sql/rapids/shims/OriginContextShim.scala
similarity index 100%
rename from sql-plugin/src/main/spark340/scala/org/apache/spark/sql/rapids/shims/OriginContextShim.scala
rename to sql-plugin-shims/src/main/spark340/scala/org/apache/spark/sql/rapids/shims/OriginContextShim.scala
diff --git a/sql-plugin/src/main/spark341/scala/com/nvidia/spark/rapids/shims/spark341/SparkShimServiceProvider.scala b/sql-plugin-shims/src/main/spark341/scala/com/nvidia/spark/rapids/shims/spark341/SparkShimServiceProvider.scala
similarity index 96%
rename from sql-plugin/src/main/spark341/scala/com/nvidia/spark/rapids/shims/spark341/SparkShimServiceProvider.scala
rename to sql-plugin-shims/src/main/spark341/scala/com/nvidia/spark/rapids/shims/spark341/SparkShimServiceProvider.scala
index 38f9fd0307f..9c9c844145d 100644
--- a/sql-plugin/src/main/spark341/scala/com/nvidia/spark/rapids/shims/spark341/SparkShimServiceProvider.scala
+++ b/sql-plugin-shims/src/main/spark341/scala/com/nvidia/spark/rapids/shims/spark341/SparkShimServiceProvider.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2023, NVIDIA CORPORATION.
+ * Copyright (c) 2023-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
diff --git a/sql-plugin/src/main/spark341db/scala/com/nvidia/spark/rapids/shims/spark341db/SparkShimServiceProvider.scala b/sql-plugin-shims/src/main/spark341db/scala/com/nvidia/spark/rapids/shims/spark341db/SparkShimServiceProvider.scala
similarity index 96%
rename from sql-plugin/src/main/spark341db/scala/com/nvidia/spark/rapids/shims/spark341db/SparkShimServiceProvider.scala
rename to sql-plugin-shims/src/main/spark341db/scala/com/nvidia/spark/rapids/shims/spark341db/SparkShimServiceProvider.scala
index 72ed2c7c067..6c607615c7d 100644
--- a/sql-plugin/src/main/spark341db/scala/com/nvidia/spark/rapids/shims/spark341db/SparkShimServiceProvider.scala
+++ b/sql-plugin-shims/src/main/spark341db/scala/com/nvidia/spark/rapids/shims/spark341db/SparkShimServiceProvider.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2023-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2023-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
diff --git a/sql-plugin/src/main/spark342/scala/com/nvidia/spark/rapids/shims/spark342/SparkShimServiceProvider.scala b/sql-plugin-shims/src/main/spark342/scala/com/nvidia/spark/rapids/shims/spark342/SparkShimServiceProvider.scala
similarity index 96%
rename from sql-plugin/src/main/spark342/scala/com/nvidia/spark/rapids/shims/spark342/SparkShimServiceProvider.scala
rename to sql-plugin-shims/src/main/spark342/scala/com/nvidia/spark/rapids/shims/spark342/SparkShimServiceProvider.scala
index 6b00a7a762e..7833fc477c6 100644
--- a/sql-plugin/src/main/spark342/scala/com/nvidia/spark/rapids/shims/spark342/SparkShimServiceProvider.scala
+++ b/sql-plugin-shims/src/main/spark342/scala/com/nvidia/spark/rapids/shims/spark342/SparkShimServiceProvider.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2023, NVIDIA CORPORATION.
+ * Copyright (c) 2023-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
diff --git a/sql-plugin/src/main/spark343/scala/com/nvidia/spark/rapids/shims/spark343/SparkShimServiceProvider.scala b/sql-plugin-shims/src/main/spark343/scala/com/nvidia/spark/rapids/shims/spark343/SparkShimServiceProvider.scala
similarity index 96%
rename from sql-plugin/src/main/spark343/scala/com/nvidia/spark/rapids/shims/spark343/SparkShimServiceProvider.scala
rename to sql-plugin-shims/src/main/spark343/scala/com/nvidia/spark/rapids/shims/spark343/SparkShimServiceProvider.scala
index ff35d06a9c7..dc028c33f24 100644
--- a/sql-plugin/src/main/spark343/scala/com/nvidia/spark/rapids/shims/spark343/SparkShimServiceProvider.scala
+++ b/sql-plugin-shims/src/main/spark343/scala/com/nvidia/spark/rapids/shims/spark343/SparkShimServiceProvider.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2024, NVIDIA CORPORATION.
+ * Copyright (c) 2024-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
diff --git a/sql-plugin/src/main/spark344/scala/com/nvidia/spark/rapids/shims/spark344/SparkShimServiceProvider.scala b/sql-plugin-shims/src/main/spark344/scala/com/nvidia/spark/rapids/shims/spark344/SparkShimServiceProvider.scala
similarity index 96%
rename from sql-plugin/src/main/spark344/scala/com/nvidia/spark/rapids/shims/spark344/SparkShimServiceProvider.scala
rename to sql-plugin-shims/src/main/spark344/scala/com/nvidia/spark/rapids/shims/spark344/SparkShimServiceProvider.scala
index 80f042e0ee7..13fd8106a47 100644
--- a/sql-plugin/src/main/spark344/scala/com/nvidia/spark/rapids/shims/spark344/SparkShimServiceProvider.scala
+++ b/sql-plugin-shims/src/main/spark344/scala/com/nvidia/spark/rapids/shims/spark344/SparkShimServiceProvider.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2024, NVIDIA CORPORATION.
+ * Copyright (c) 2024-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
diff --git a/sql-plugin/src/main/spark350/scala/com/nvidia/spark/rapids/shims/spark350/SparkShimServiceProvider.scala b/sql-plugin-shims/src/main/spark350/scala/com/nvidia/spark/rapids/shims/spark350/SparkShimServiceProvider.scala
similarity index 96%
rename from sql-plugin/src/main/spark350/scala/com/nvidia/spark/rapids/shims/spark350/SparkShimServiceProvider.scala
rename to sql-plugin-shims/src/main/spark350/scala/com/nvidia/spark/rapids/shims/spark350/SparkShimServiceProvider.scala
index 91fcf7cf40a..c70f14547d1 100644
--- a/sql-plugin/src/main/spark350/scala/com/nvidia/spark/rapids/shims/spark350/SparkShimServiceProvider.scala
+++ b/sql-plugin-shims/src/main/spark350/scala/com/nvidia/spark/rapids/shims/spark350/SparkShimServiceProvider.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2023, NVIDIA CORPORATION.
+ * Copyright (c) 2023-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
diff --git a/sql-plugin/src/main/spark350db143/scala/com/nvidia/spark/rapids/shims/spark350db143/SparkShimServiceProvider.scala b/sql-plugin-shims/src/main/spark350db143/scala/com/nvidia/spark/rapids/shims/spark350db143/SparkShimServiceProvider.scala
similarity index 100%
rename from sql-plugin/src/main/spark350db143/scala/com/nvidia/spark/rapids/shims/spark350db143/SparkShimServiceProvider.scala
rename to sql-plugin-shims/src/main/spark350db143/scala/com/nvidia/spark/rapids/shims/spark350db143/SparkShimServiceProvider.scala
diff --git a/sql-plugin/src/main/spark350db143/scala/org/apache/spark/sql/rapids/shims/SequenceSizeExceededLimitErrorBuilder.scala b/sql-plugin-shims/src/main/spark350db143/scala/org/apache/spark/sql/rapids/shims/SequenceSizeExceededLimitErrorBuilder.scala
similarity index 100%
rename from sql-plugin/src/main/spark350db143/scala/org/apache/spark/sql/rapids/shims/SequenceSizeExceededLimitErrorBuilder.scala
rename to sql-plugin-shims/src/main/spark350db143/scala/org/apache/spark/sql/rapids/shims/SequenceSizeExceededLimitErrorBuilder.scala
diff --git a/sql-plugin/src/main/spark351/scala/com/nvidia/spark/rapids/shims/spark351/SparkShimServiceProvider.scala b/sql-plugin-shims/src/main/spark351/scala/com/nvidia/spark/rapids/shims/spark351/SparkShimServiceProvider.scala
similarity index 96%
rename from sql-plugin/src/main/spark351/scala/com/nvidia/spark/rapids/shims/spark351/SparkShimServiceProvider.scala
rename to sql-plugin-shims/src/main/spark351/scala/com/nvidia/spark/rapids/shims/spark351/SparkShimServiceProvider.scala
index 8b1bace8aa1..a1a1f5a51a9 100644
--- a/sql-plugin/src/main/spark351/scala/com/nvidia/spark/rapids/shims/spark351/SparkShimServiceProvider.scala
+++ b/sql-plugin-shims/src/main/spark351/scala/com/nvidia/spark/rapids/shims/spark351/SparkShimServiceProvider.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2023, NVIDIA CORPORATION.
+ * Copyright (c) 2023-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
diff --git a/sql-plugin/src/main/spark352/scala/com/nvidia/spark/rapids/shims/spark352/SparkShimServiceProvider.scala b/sql-plugin-shims/src/main/spark352/scala/com/nvidia/spark/rapids/shims/spark352/SparkShimServiceProvider.scala
similarity index 96%
rename from sql-plugin/src/main/spark352/scala/com/nvidia/spark/rapids/shims/spark352/SparkShimServiceProvider.scala
rename to sql-plugin-shims/src/main/spark352/scala/com/nvidia/spark/rapids/shims/spark352/SparkShimServiceProvider.scala
index 5a6ba4d43c9..a6cb8368ba2 100644
--- a/sql-plugin/src/main/spark352/scala/com/nvidia/spark/rapids/shims/spark352/SparkShimServiceProvider.scala
+++ b/sql-plugin-shims/src/main/spark352/scala/com/nvidia/spark/rapids/shims/spark352/SparkShimServiceProvider.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2024, NVIDIA CORPORATION.
+ * Copyright (c) 2024-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
diff --git a/sql-plugin/src/main/spark353/scala/com/nvidia/spark/rapids/shims/spark353/SparkShimServiceProvider.scala b/sql-plugin-shims/src/main/spark353/scala/com/nvidia/spark/rapids/shims/spark353/SparkShimServiceProvider.scala
similarity index 96%
rename from sql-plugin/src/main/spark353/scala/com/nvidia/spark/rapids/shims/spark353/SparkShimServiceProvider.scala
rename to sql-plugin-shims/src/main/spark353/scala/com/nvidia/spark/rapids/shims/spark353/SparkShimServiceProvider.scala
index 8eaf51f7177..2945458b56f 100644
--- a/sql-plugin/src/main/spark353/scala/com/nvidia/spark/rapids/shims/spark353/SparkShimServiceProvider.scala
+++ b/sql-plugin-shims/src/main/spark353/scala/com/nvidia/spark/rapids/shims/spark353/SparkShimServiceProvider.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2024, NVIDIA CORPORATION.
+ * Copyright (c) 2024-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
diff --git a/sql-plugin/src/main/spark354/scala/com/nvidia/spark/rapids/shims/spark354/SparkShimServiceProvider.scala b/sql-plugin-shims/src/main/spark354/scala/com/nvidia/spark/rapids/shims/spark354/SparkShimServiceProvider.scala
similarity index 96%
rename from sql-plugin/src/main/spark354/scala/com/nvidia/spark/rapids/shims/spark354/SparkShimServiceProvider.scala
rename to sql-plugin-shims/src/main/spark354/scala/com/nvidia/spark/rapids/shims/spark354/SparkShimServiceProvider.scala
index 46d9887b0c8..7002ba891cd 100644
--- a/sql-plugin/src/main/spark354/scala/com/nvidia/spark/rapids/shims/spark354/SparkShimServiceProvider.scala
+++ b/sql-plugin-shims/src/main/spark354/scala/com/nvidia/spark/rapids/shims/spark354/SparkShimServiceProvider.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2025, NVIDIA CORPORATION.
+ * Copyright (c) 2025-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
diff --git a/sql-plugin/src/main/spark355/scala/com/nvidia/spark/rapids/shims/spark355/SparkShimServiceProvider.scala b/sql-plugin-shims/src/main/spark355/scala/com/nvidia/spark/rapids/shims/spark355/SparkShimServiceProvider.scala
similarity index 96%
rename from sql-plugin/src/main/spark355/scala/com/nvidia/spark/rapids/shims/spark355/SparkShimServiceProvider.scala
rename to sql-plugin-shims/src/main/spark355/scala/com/nvidia/spark/rapids/shims/spark355/SparkShimServiceProvider.scala
index 7175d0eb948..776871d176c 100644
--- a/sql-plugin/src/main/spark355/scala/com/nvidia/spark/rapids/shims/spark355/SparkShimServiceProvider.scala
+++ b/sql-plugin-shims/src/main/spark355/scala/com/nvidia/spark/rapids/shims/spark355/SparkShimServiceProvider.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2025, NVIDIA CORPORATION.
+ * Copyright (c) 2025-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
diff --git a/sql-plugin/src/main/spark356/scala/com/nvidia/spark/rapids/shims/spark356/SparkShimServiceProvider.scala b/sql-plugin-shims/src/main/spark356/scala/com/nvidia/spark/rapids/shims/spark356/SparkShimServiceProvider.scala
similarity index 96%
rename from sql-plugin/src/main/spark356/scala/com/nvidia/spark/rapids/shims/spark356/SparkShimServiceProvider.scala
rename to sql-plugin-shims/src/main/spark356/scala/com/nvidia/spark/rapids/shims/spark356/SparkShimServiceProvider.scala
index 9f55ea238cd..f9ce0d6aeee 100644
--- a/sql-plugin/src/main/spark356/scala/com/nvidia/spark/rapids/shims/spark356/SparkShimServiceProvider.scala
+++ b/sql-plugin-shims/src/main/spark356/scala/com/nvidia/spark/rapids/shims/spark356/SparkShimServiceProvider.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2025, NVIDIA CORPORATION.
+ * Copyright (c) 2025-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
diff --git a/sql-plugin/src/main/spark357/scala/com/nvidia/spark/rapids/shims/spark357/SparkShimServiceProvider.scala b/sql-plugin-shims/src/main/spark357/scala/com/nvidia/spark/rapids/shims/spark357/SparkShimServiceProvider.scala
similarity index 96%
rename from sql-plugin/src/main/spark357/scala/com/nvidia/spark/rapids/shims/spark357/SparkShimServiceProvider.scala
rename to sql-plugin-shims/src/main/spark357/scala/com/nvidia/spark/rapids/shims/spark357/SparkShimServiceProvider.scala
index 971678a51bf..bd376eee633 100644
--- a/sql-plugin/src/main/spark357/scala/com/nvidia/spark/rapids/shims/spark357/SparkShimServiceProvider.scala
+++ b/sql-plugin-shims/src/main/spark357/scala/com/nvidia/spark/rapids/shims/spark357/SparkShimServiceProvider.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2025, NVIDIA CORPORATION.
+ * Copyright (c) 2025-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
diff --git a/sql-plugin/src/main/spark358/scala/com/nvidia/spark/rapids/shims/spark358/SparkShimServiceProvider.scala b/sql-plugin-shims/src/main/spark358/scala/com/nvidia/spark/rapids/shims/spark358/SparkShimServiceProvider.scala
similarity index 100%
rename from sql-plugin/src/main/spark358/scala/com/nvidia/spark/rapids/shims/spark358/SparkShimServiceProvider.scala
rename to sql-plugin-shims/src/main/spark358/scala/com/nvidia/spark/rapids/shims/spark358/SparkShimServiceProvider.scala
diff --git a/sql-plugin/src/main/spark400/scala/com/nvidia/spark/rapids/shims/spark400/SparkShimServiceProvider.scala b/sql-plugin-shims/src/main/spark400/scala/com/nvidia/spark/rapids/shims/spark400/SparkShimServiceProvider.scala
similarity index 100%
rename from sql-plugin/src/main/spark400/scala/com/nvidia/spark/rapids/shims/spark400/SparkShimServiceProvider.scala
rename to sql-plugin-shims/src/main/spark400/scala/com/nvidia/spark/rapids/shims/spark400/SparkShimServiceProvider.scala
diff --git a/sql-plugin/src/main/spark400/scala/org/apache/spark/sql/rapids/shims/OriginContextShim.scala b/sql-plugin-shims/src/main/spark400/scala/org/apache/spark/sql/rapids/shims/OriginContextShim.scala
similarity index 100%
rename from sql-plugin/src/main/spark400/scala/org/apache/spark/sql/rapids/shims/OriginContextShim.scala
rename to sql-plugin-shims/src/main/spark400/scala/org/apache/spark/sql/rapids/shims/OriginContextShim.scala
diff --git a/sql-plugin/src/main/spark400/scala/org/apache/spark/sql/rapids/shims/TrampolineConnectShims.scala b/sql-plugin-shims/src/main/spark400/scala/org/apache/spark/sql/rapids/shims/TrampolineConnectShims.scala
similarity index 100%
rename from sql-plugin/src/main/spark400/scala/org/apache/spark/sql/rapids/shims/TrampolineConnectShims.scala
rename to sql-plugin-shims/src/main/spark400/scala/org/apache/spark/sql/rapids/shims/TrampolineConnectShims.scala
diff --git a/sql-plugin/src/main/spark400db173/scala/com/nvidia/spark/rapids/shims/spark400db173/SparkShimServiceProvider.scala b/sql-plugin-shims/src/main/spark400db173/scala/com/nvidia/spark/rapids/shims/spark400db173/SparkShimServiceProvider.scala
similarity index 100%
rename from sql-plugin/src/main/spark400db173/scala/com/nvidia/spark/rapids/shims/spark400db173/SparkShimServiceProvider.scala
rename to sql-plugin-shims/src/main/spark400db173/scala/com/nvidia/spark/rapids/shims/spark400db173/SparkShimServiceProvider.scala
diff --git a/sql-plugin/src/main/spark400db173/scala/org/apache/spark/sql/rapids/ShuffleManagerShims.scala b/sql-plugin-shims/src/main/spark400db173/scala/org/apache/spark/sql/rapids/ShuffleManagerShims.scala
similarity index 100%
rename from sql-plugin/src/main/spark400db173/scala/org/apache/spark/sql/rapids/ShuffleManagerShims.scala
rename to sql-plugin-shims/src/main/spark400db173/scala/org/apache/spark/sql/rapids/ShuffleManagerShims.scala
diff --git a/sql-plugin/src/main/spark400db173/scala/org/apache/spark/storage/ShuffleClientShims.scala b/sql-plugin-shims/src/main/spark400db173/scala/org/apache/spark/storage/ShuffleClientShims.scala
similarity index 99%
rename from sql-plugin/src/main/spark400db173/scala/org/apache/spark/storage/ShuffleClientShims.scala
rename to sql-plugin-shims/src/main/spark400db173/scala/org/apache/spark/storage/ShuffleClientShims.scala
index aedfb30f7e9..12a6ac402df 100644
--- a/sql-plugin/src/main/spark400db173/scala/org/apache/spark/storage/ShuffleClientShims.scala
+++ b/sql-plugin-shims/src/main/spark400db173/scala/org/apache/spark/storage/ShuffleClientShims.scala
@@ -34,4 +34,3 @@ object ShuffleClientShims {
     client.diagnoseCorruption(host, port, execId, blockId.name, checksum, algorithm)
   }
 }
-
diff --git a/sql-plugin/src/main/spark401/scala/com/nvidia/spark/rapids/shims/spark401/SparkShimServiceProvider.scala b/sql-plugin-shims/src/main/spark401/scala/com/nvidia/spark/rapids/shims/spark401/SparkShimServiceProvider.scala
similarity index 100%
rename from sql-plugin/src/main/spark401/scala/com/nvidia/spark/rapids/shims/spark401/SparkShimServiceProvider.scala
rename to sql-plugin-shims/src/main/spark401/scala/com/nvidia/spark/rapids/shims/spark401/SparkShimServiceProvider.scala
diff --git a/sql-plugin/src/main/spark402/scala/com/nvidia/spark/rapids/shims/spark402/SparkShimServiceProvider.scala b/sql-plugin-shims/src/main/spark402/scala/com/nvidia/spark/rapids/shims/spark402/SparkShimServiceProvider.scala
similarity index 100%
rename from sql-plugin/src/main/spark402/scala/com/nvidia/spark/rapids/shims/spark402/SparkShimServiceProvider.scala
rename to sql-plugin-shims/src/main/spark402/scala/com/nvidia/spark/rapids/shims/spark402/SparkShimServiceProvider.scala
diff --git a/sql-plugin/src/main/spark411/scala/com/nvidia/spark/rapids/shims/spark411/SparkShimServiceProvider.scala b/sql-plugin-shims/src/main/spark411/scala/com/nvidia/spark/rapids/shims/spark411/SparkShimServiceProvider.scala
similarity index 100%
rename from sql-plugin/src/main/spark411/scala/com/nvidia/spark/rapids/shims/spark411/SparkShimServiceProvider.scala
rename to sql-plugin-shims/src/main/spark411/scala/com/nvidia/spark/rapids/shims/spark411/SparkShimServiceProvider.scala
diff --git a/sql-plugin/src/main/spark411/scala/org/apache/spark/sql/rapids/shims/FileCommitProtocolShims.scala b/sql-plugin-shims/src/main/spark411/scala/org/apache/spark/sql/rapids/shims/FileCommitProtocolShims.scala
similarity index 100%
rename from sql-plugin/src/main/spark411/scala/org/apache/spark/sql/rapids/shims/FileCommitProtocolShims.scala
rename to sql-plugin-shims/src/main/spark411/scala/org/apache/spark/sql/rapids/shims/FileCommitProtocolShims.scala
diff --git a/sql-plugin/pom.xml b/sql-plugin/pom.xml
index de478137c32..42de0833323 100644
--- a/sql-plugin/pom.xml
+++ b/sql-plugin/pom.xml
@@ -54,12 +54,37 @@
             <version>${spark-rapids-private.version}</version>
             <classifier>${spark.version.classifier}</classifier>
         </dependency>
+        <dependency>
+            <groupId>com.nvidia</groupId>
+            <artifactId>rapids-4-spark-sql-plugin-format_${scala.binary.version}</artifactId>
+            <version>${project.version}</version>
+            <classifier>${spark.version.classifier}</classifier>
+        </dependency>
+        <dependency>
+            <groupId>com.nvidia</groupId>
+            <artifactId>rapids-4-spark-sql-plugin-fileio_${scala.binary.version}</artifactId>
+            <version>${project.version}</version>
+            <classifier>${spark.version.classifier}</classifier>
+        </dependency>
+        <dependency>
+            <groupId>com.nvidia</groupId>
+            <artifactId>rapids-4-spark-sql-plugin-columnar_${scala.binary.version}</artifactId>
+            <version>${project.version}</version>
+            <classifier>${spark.version.classifier}</classifier>
+        </dependency>
         <dependency>
             <groupId>com.nvidia</groupId>
             <artifactId>rapids-4-spark-sql-plugin-api_${scala.binary.version}</artifactId>
             <version>${project.version}</version>
             <classifier>${spark.version.classifier}</classifier>
         </dependency>
+        <dependency>
+            <groupId>com.nvidia</groupId>
+            <artifactId>rapids-4-spark-sql-shims_${scala.binary.version}</artifactId>
+            <version>${project.version}</version>
+            <classifier>${spark.version.classifier}</classifier>
+            <scope>provided</scope>
+        </dependency>
         <dependency>
             <groupId>org.scala-lang</groupId>
             <artifactId>scala-library</artifactId>
@@ -219,6 +244,27 @@
                 <groupId>net.alchim31.maven</groupId>
                 <artifactId>scala-maven-plugin</artifactId>
             </plugin>
+            <plugin>
+                <groupId>org.apache.maven.plugins</groupId>
+                <artifactId>maven-dependency-plugin</artifactId>
+                <version>3.6.1</version>
+                <executions>
+                    <execution> <!-- merge the sql-shims classes into this module's output -->
+                        <id>unpack-sql-plugin-shims</id>
+                        <phase>prepare-package</phase> <!-- runs ahead of the package phase -->
+                        <goals>
+                            <goal>unpack-dependencies</goal>
+                        </goals>
+                        <configuration>
+                            <includeGroupIds>com.nvidia</includeGroupIds>
+                            <includeArtifactIds>rapids-4-spark-sql-shims_${scala.binary.version}</includeArtifactIds>
+                            <excludeTransitive>true</excludeTransitive> <!-- shims artifact only -->
+                            <includes>**/*.class</includes>
+                            <outputDirectory>${project.build.outputDirectory}</outputDirectory>
+                        </configuration>
+                    </execution>
+                </executions>
+            </plugin>
             <plugin>
                 <groupId>org.apache.rat</groupId>
                 <artifactId>apache-rat-plugin</artifactId>
diff --git a/sql-plugin/src/main/java/com/nvidia/spark/rapids/InternalRowToColumnarBatchIterator.java b/sql-plugin/src/main/java/com/nvidia/spark/rapids/InternalRowToColumnarBatchIterator.java
index 400b54626d8..dbf27a96c41 100644
--- a/sql-plugin/src/main/java/com/nvidia/spark/rapids/InternalRowToColumnarBatchIterator.java
+++ b/sql-plugin/src/main/java/com/nvidia/spark/rapids/InternalRowToColumnarBatchIterator.java
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2020-2024, NVIDIA CORPORATION.
+ * Copyright (c) 2020-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -228,7 +228,7 @@ private HostMemoryBuffer[] getHostBuffersWithRetry(
     try {
       hBuf = HostAlloc$.MODULE$.alloc((dataBytes + offsetBytes),true);
       SpillableHostBuffer sBuf = SpillableHostBuffer$.MODULE$.apply(hBuf, hBuf.getLength(),
-          SpillPriorities$.MODULE$.ACTIVE_ON_DECK_PRIORITY());
+          SpillPriorities.ACTIVE_ON_DECK_PRIORITY);
       hBuf = null;  // taken over by spillable host buffer
       return Tuple2.apply(sBuf, numRowsWrapper);
     } finally {
@@ -258,7 +258,7 @@ private SpillableColumnarBatch makeSpillableBatch(ColumnVector devColumn) {
         new ColumnarBatch(
             new org.apache.spark.sql.vectorized.ColumnVector[]{gpuCV},
             (int)gpuCV.getRowCount()),
-        SpillPriorities.ACTIVE_ON_DECK_PRIORITY());
+        SpillPriorities.ACTIVE_ON_DECK_PRIORITY);
   }
 
   /**
diff --git a/sql-plugin/src/main/java/com/nvidia/spark/rapids/SpillableKudoTable.java b/sql-plugin/src/main/java/com/nvidia/spark/rapids/SpillableKudoTable.java
new file mode 100644
index 00000000000..a2585829858
--- /dev/null
+++ b/sql-plugin/src/main/java/com/nvidia/spark/rapids/SpillableKudoTable.java
@@ -0,0 +1,67 @@
+/*
+ * Copyright (c) 2025-2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.nvidia.spark.rapids;
+
+import ai.rapids.cudf.HostMemoryBuffer;
+import com.nvidia.spark.rapids.jni.kudo.KudoTable;
+import com.nvidia.spark.rapids.jni.kudo.KudoTableHeader;
+
+/** Pairs a Kudo table header with its host data held in a spillable host buffer. */
+public class SpillableKudoTable implements AutoCloseable {
+  public final KudoTableHeader header;
+  /** Byte length recorded for the table data; {@link #from} stores 0 for a null buffer. */
+  public final long length;
+  /** Spillable holder of the table data; {@link #from} leaves it null for a null buffer. */
+  private final SpillableHostBuffer shb;
+
+  public SpillableKudoTable(KudoTableHeader header, long length, SpillableHostBuffer shb) {
+    this.header = header;
+    this.length = length;
+    this.shb = shb;
+  }
+
+  /** Wraps {@code buffer} at ACTIVE_BATCHING_PRIORITY, or builds an empty table if it is null. */
+  public static SpillableKudoTable from(KudoTableHeader header, HostMemoryBuffer buffer) {
+    if (buffer == null) {
+      return new SpillableKudoTable(header, 0, null);
+    }
+    long numBytes = buffer.getLength();
+    return new SpillableKudoTable(header, numBytes,
+        SpillableHostBuffer.apply(buffer, numBytes, SpillPriorities.ACTIVE_BATCHING_PRIORITY));
+  }
+
+  /** Creates a {@link KudoTable} over the header and the buffer obtained from the holder, if any. */
+  public KudoTable makeKudoTable() {
+    if (shb == null) {
+      return new KudoTable(header, null);
+    }
+    return new KudoTable(header, shb.getHostBuffer());
+  }
+
+  @Override
+  public String toString() {
+    return "SpillableKudoTable{header=" + header + ", shb=" + shb + '}';
+  }
+
+  /** Closes the spillable holder when one is present; otherwise does nothing. */
+  @Override
+  public void close() {
+    if (shb != null) {
+      shb.close();
+    }
+  }
+}
diff --git a/sql-plugin/src/main/java/com/nvidia/spark/rapids/fileio/RapidsInputFiles.java b/sql-plugin/src/main/java/com/nvidia/spark/rapids/fileio/RapidsInputFiles.java
deleted file mode 100644
index e30bbce09b3..00000000000
--- a/sql-plugin/src/main/java/com/nvidia/spark/rapids/fileio/RapidsInputFiles.java
+++ /dev/null
@@ -1,41 +0,0 @@
-/*
- * Copyright (c) 2026, NVIDIA CORPORATION.
- *
- * Licensed under the Apache License, Version 2.0 (the "License");
- * you may not use this file except in compliance with the License.
- * You may obtain a copy of the License at
- *
- *     http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-
-package com.nvidia.spark.rapids.fileio;
-
-import com.nvidia.spark.rapids.PerfIOConf;
-import org.apache.spark.SparkEnv;
-
-/**
- * Static helpers shared by {@link com.nvidia.spark.rapids.jni.fileio.RapidsInputFile}
- * implementations.
- */
-public final class RapidsInputFiles {
-    private RapidsInputFiles() {}
-
-    /**
-     * True iff {@code spark.rapids.perfio.s3.enabled} is set to {@code true} on
-     * the active SparkConf. Returns false when no {@link SparkEnv} is initialized
-     * (e.g. before driver bring-up) so callers default to the non-PerfIO path.
-     */
-    public static boolean isS3PerfEnabled() {
-        SparkEnv env = SparkEnv.get();
-        if (env == null) {
-            return false;
-        }
-        return env.conf().getBoolean(PerfIOConf.S3PERF_ENABLED().key(), false);
-    }
-}
diff --git a/sql-plugin/src/main/java/com/nvidia/spark/rapids/fileio/hadoop/PerfIOS3Reader.java b/sql-plugin/src/main/java/com/nvidia/spark/rapids/fileio/hadoop/PerfIOS3Reader.java
new file mode 100644
index 00000000000..5277c382ee0
--- /dev/null
+++ b/sql-plugin/src/main/java/com/nvidia/spark/rapids/fileio/hadoop/PerfIOS3Reader.java
@@ -0,0 +1,90 @@
+/*
+ * Copyright (c) 2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.nvidia.spark.rapids.fileio.hadoop;
+
+import ai.rapids.cudf.HostMemoryBuffer;
+import com.nvidia.spark.rapids.IntRangeWithOffset;
+import com.nvidia.spark.rapids.PerfIO$;
+import com.nvidia.spark.rapids.PerfIOConf;
+import com.nvidia.spark.rapids.RangeWithOffset;
+import com.nvidia.spark.rapids.SuffixRangeWithOffset;
+import com.nvidia.spark.rapids.fileio.RapidsInputFiles.S3PerfReader;
+import com.nvidia.spark.rapids.jni.fileio.RapidsInputFile;
+import org.apache.hadoop.conf.Configuration;
+import org.apache.spark.SparkEnv;
+import scala.Option;
+import scala.collection.JavaConverters;
+
+import java.io.IOException;
+import java.net.URI;
+import java.util.ArrayList;
+import java.util.List;
+
+/** SQL-plugin bridge that lets Java-only file I/O classes reach private Scala PerfIO state. */
+public final class PerfIOS3Reader implements S3PerfReader {
+    public static final PerfIOS3Reader INSTANCE = new PerfIOS3Reader();
+
+    private PerfIOS3Reader() {}
+
+    /** False when no SparkEnv exists; otherwise the S3PERF_ENABLED conf value (default false). */
+    @Override
+    public boolean isEnabled() {
+        SparkEnv sparkEnv = SparkEnv.get();
+        return sparkEnv != null
+                && sparkEnv.conf().getBoolean(PerfIOConf.S3PERF_ENABLED().key(), false);
+    }
+
+    /** Maps every copy range to an IntRangeWithOffset and hands them all to PerfIO at once. */
+    @Override
+    public boolean readVectored(
+            Configuration hadoopConf,
+            URI fileUri,
+            HostMemoryBuffer output,
+            List<RapidsInputFile.CopyRange> copyRanges) throws IOException {
+        List<RangeWithOffset> perfRanges = new ArrayList<>(copyRanges.size());
+        for (RapidsInputFile.CopyRange copy : copyRanges) {
+            perfRanges.add(new IntRangeWithOffset(
+                    copy.getInputOffset(), copy.getLength(), copy.getOutputOffset()));
+        }
+        return readToHostMemory(hadoopConf, fileUri, output, perfRanges);
+    }
+
+    /** Hands PerfIO a single SuffixRangeWithOffset built from length and outputOffset. */
+    @Override
+    public boolean readTail(
+            Configuration hadoopConf,
+            URI fileUri,
+            HostMemoryBuffer output,
+            long length,
+            long outputOffset) throws IOException {
+        List<RangeWithOffset> suffixOnly = new ArrayList<>(1);
+        suffixOnly.add(new SuffixRangeWithOffset(length, outputOffset));
+        return readToHostMemory(hadoopConf, fileUri, output, suffixOnly);
+    }
+
+    /** Reports whether PerfIO.readToHostMemory returned a defined Option for these ranges. */
+    private boolean readToHostMemory(
+            Configuration hadoopConf,
+            URI fileUri,
+            HostMemoryBuffer output,
+            List<RangeWithOffset> ranges) {
+        return PerfIO$.MODULE$
+                .readToHostMemory(hadoopConf, output, fileUri,
+                        () -> JavaConverters.asScalaBufferConverter(ranges).asScala().toSeq())
+                .isDefined();
+    }
+}
diff --git a/sql-plugin/src/main/java/com/nvidia/spark/rapids/format/TransferState.java b/sql-plugin/src/main/java/com/nvidia/spark/rapids/format/TransferState.java
deleted file mode 100644
index 0fd00abac9b..00000000000
--- a/sql-plugin/src/main/java/com/nvidia/spark/rapids/format/TransferState.java
+++ /dev/null
@@ -1,20 +0,0 @@
-// automatically generated by the FlatBuffers compiler, do not modify
-
-package com.nvidia.spark.rapids.format;
-
-public final class TransferState {
-  private TransferState() { }
-  /**
-   * UCX transfer initiated on sender-side
-   */
-  public static final byte STARTED = 0;
-  /**
-   * Data has been compressed and requires meta update
-   */
-  public static final byte BUFFER_META_UPDATED = 1;
-
-  public static final String[] names = { "STARTED", "BUFFER_META_UPDATED", };
-
-  public static String name(int e) { return names[e]; }
-}
-
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/FunctionsImpl.scala b/sql-plugin/src/main/scala/com/nvidia/spark/FunctionsImpl.scala
index 7c27cb79054..54b47384466 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/FunctionsImpl.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/FunctionsImpl.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2024, NVIDIA CORPORATION.
+ * Copyright (c) 2024-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -35,7 +35,7 @@ class FunctionsImpl extends Functions {
    * nondeterministic, call the API `UserDefinedFunction.asNondeterministic()`.
    */
   override def df_udf(f: Function0[Column]): UserDefinedFunction =
-    sp_udf(DFUDF0(f), LongType)
+    sp_udf(new DFUDF0(f), LongType)
 
   /**
    * Defines a Scala closure of Columns as user-defined function (UDF).
@@ -43,7 +43,7 @@ class FunctionsImpl extends Functions {
    * nondeterministic, call the API `UserDefinedFunction.asNondeterministic()`.
    */
   override def df_udf(f: Function1[Column, Column]): UserDefinedFunction =
-    sp_udf(DFUDF1(f), LongType)
+    sp_udf(new DFUDF1(f), LongType)
 
   /**
    * Defines a Scala closure of Columns as user-defined function (UDF).
@@ -51,7 +51,7 @@ class FunctionsImpl extends Functions {
    * nondeterministic, call the API `UserDefinedFunction.asNondeterministic()`.
    */
   override def df_udf(f: Function2[Column, Column, Column]): UserDefinedFunction =
-    sp_udf(DFUDF2(f), LongType)
+    sp_udf(new DFUDF2(f), LongType)
 
   /**
    * Defines a Scala closure of Columns as user-defined function (UDF).
@@ -59,7 +59,7 @@ class FunctionsImpl extends Functions {
    * nondeterministic, call the API `UserDefinedFunction.asNondeterministic()`.
    */
   override def df_udf(f: Function3[Column, Column, Column, Column]): UserDefinedFunction =
-    sp_udf(DFUDF3(f), LongType)
+    sp_udf(new DFUDF3(f), LongType)
 
   /**
    * Defines a Scala closure of Columns as user-defined function (UDF).
@@ -67,7 +67,7 @@ class FunctionsImpl extends Functions {
    * nondeterministic, call the API `UserDefinedFunction.asNondeterministic()`.
    */
   override def df_udf(f: Function4[Column, Column, Column, Column, Column]): UserDefinedFunction =
-    sp_udf(DFUDF4(f), LongType)
+    sp_udf(new DFUDF4(f), LongType)
 
   /**
    * Defines a Scala closure of Columns as user-defined function (UDF).
@@ -75,7 +75,7 @@ class FunctionsImpl extends Functions {
    * nondeterministic, call the API `UserDefinedFunction.asNondeterministic()`.
    */
   override def df_udf(f: Function5[Column, Column, Column, Column, Column,
-    Column]): UserDefinedFunction = sp_udf(DFUDF5(f), LongType)
+    Column]): UserDefinedFunction = sp_udf(new DFUDF5(f), LongType)
 
   /**
    * Defines a Scala closure of Columns as user-defined function (UDF).
@@ -83,7 +83,7 @@ class FunctionsImpl extends Functions {
    * nondeterministic, call the API `UserDefinedFunction.asNondeterministic()`.
    */
   override def df_udf(f: Function6[Column, Column, Column, Column, Column, Column,
-    Column]): UserDefinedFunction = sp_udf(DFUDF6(f), LongType)
+    Column]): UserDefinedFunction = sp_udf(new DFUDF6(f), LongType)
 
   /**
    * Defines a Scala closure of Columns as user-defined function (UDF).
@@ -91,7 +91,7 @@ class FunctionsImpl extends Functions {
    * nondeterministic, call the API `UserDefinedFunction.asNondeterministic()`.
    */
   override def df_udf(f: Function7[Column, Column, Column, Column, Column, Column,
-    Column, Column]): UserDefinedFunction = sp_udf(DFUDF7(f), LongType)
+    Column, Column]): UserDefinedFunction = sp_udf(new DFUDF7(f), LongType)
 
   /**
    * Defines a Scala closure of Columns as user-defined function (UDF).
@@ -99,7 +99,7 @@ class FunctionsImpl extends Functions {
    * nondeterministic, call the API `UserDefinedFunction.asNondeterministic()`.
    */
   override def df_udf(f: Function8[Column, Column, Column, Column, Column, Column,
-    Column, Column, Column]): UserDefinedFunction = sp_udf(DFUDF8(f), LongType)
+    Column, Column, Column]): UserDefinedFunction = sp_udf(new DFUDF8(f), LongType)
 
   /**
    * Defines a Scala closure of Columns as user-defined function (UDF).
@@ -107,7 +107,7 @@ class FunctionsImpl extends Functions {
    * nondeterministic, call the API `UserDefinedFunction.asNondeterministic()`.
    */
   override def df_udf(f: Function9[Column, Column, Column, Column, Column, Column,
-    Column, Column, Column, Column]): UserDefinedFunction = sp_udf(DFUDF9(f), LongType)
+    Column, Column, Column, Column]): UserDefinedFunction = sp_udf(new DFUDF9(f), LongType)
 
   /**
    * Defines a Scala closure of Columns as user-defined function (UDF).
@@ -115,7 +115,7 @@ class FunctionsImpl extends Functions {
    * nondeterministic, call the API `UserDefinedFunction.asNondeterministic()`.
    */
   override def df_udf(f: Function10[Column, Column, Column, Column, Column, Column,
-    Column, Column, Column, Column, Column]): UserDefinedFunction = sp_udf(DFUDF10(f), LongType)
+    Column, Column, Column, Column, Column]): UserDefinedFunction = sp_udf(new DFUDF10(f), LongType)
 
 
   //////////////////////////////////////////////////////////////////////////////////////////////
@@ -128,7 +128,7 @@ class FunctionsImpl extends Functions {
    * API `UserDefinedFunction.asNondeterministic()`.
    */
   override def df_udf(f: UDF0[Column]): UserDefinedFunction =
-    sp_udf(JDFUDF0(f), LongType)
+    sp_udf(new JDFUDF0(f), LongType)
 
   /**
    * Defines a Java UDF instance of Columns as user-defined function (UDF).
@@ -136,7 +136,7 @@ class FunctionsImpl extends Functions {
    * API `UserDefinedFunction.asNondeterministic()`.
    */
   override def df_udf(f: UDF1[Column, Column]): UserDefinedFunction =
-    sp_udf(JDFUDF1(f), LongType)
+    sp_udf(new JDFUDF1(f), LongType)
 
   /**
    * Defines a Java UDF instance of Columns as user-defined function (UDF).
@@ -144,7 +144,7 @@ class FunctionsImpl extends Functions {
    * API `UserDefinedFunction.asNondeterministic()`.
    */
   override def df_udf(f: UDF2[Column, Column, Column]): UserDefinedFunction =
-    sp_udf(JDFUDF2(f), LongType)
+    sp_udf(new JDFUDF2(f), LongType)
 
   /**
    * Defines a Java UDF instance of Columns as user-defined function (UDF).
@@ -152,7 +152,7 @@ class FunctionsImpl extends Functions {
    * API `UserDefinedFunction.asNondeterministic()`.
    */
   override def df_udf(f: UDF3[Column, Column, Column, Column]): UserDefinedFunction =
-    sp_udf(JDFUDF3(f), LongType)
+    sp_udf(new JDFUDF3(f), LongType)
 
   /**
    * Defines a Java UDF instance of Columns as user-defined function (UDF).
@@ -160,7 +160,7 @@ class FunctionsImpl extends Functions {
    * API `UserDefinedFunction.asNondeterministic()`.
    */
   override def df_udf(f: UDF4[Column, Column, Column, Column, Column]): UserDefinedFunction =
-    sp_udf(JDFUDF4(f), LongType)
+    sp_udf(new JDFUDF4(f), LongType)
 
   /**
    * Defines a Java UDF instance of Columns as user-defined function (UDF).
@@ -168,7 +168,7 @@ class FunctionsImpl extends Functions {
    * API `UserDefinedFunction.asNondeterministic()`.
    */
   override def df_udf(f: UDF5[Column, Column, Column, Column, Column,
-    Column]): UserDefinedFunction = sp_udf(JDFUDF5(f), LongType)
+    Column]): UserDefinedFunction = sp_udf(new JDFUDF5(f), LongType)
 
   /**
    * Defines a Java UDF instance of Columns as user-defined function (UDF).
@@ -176,7 +176,7 @@ class FunctionsImpl extends Functions {
    * API `UserDefinedFunction.asNondeterministic()`.
    */
   override def df_udf(f: UDF6[Column, Column, Column, Column, Column, Column,
-    Column]): UserDefinedFunction = sp_udf(JDFUDF6(f), LongType)
+    Column]): UserDefinedFunction = sp_udf(new JDFUDF6(f), LongType)
 
   /**
    * Defines a Java UDF instance of Columns as user-defined function (UDF).
@@ -184,7 +184,7 @@ class FunctionsImpl extends Functions {
    * API `UserDefinedFunction.asNondeterministic()`.
    */
   override def df_udf(f: UDF7[Column, Column, Column, Column, Column, Column,
-    Column, Column]): UserDefinedFunction = sp_udf(JDFUDF7(f), LongType)
+    Column, Column]): UserDefinedFunction = sp_udf(new JDFUDF7(f), LongType)
 
   /**
    * Defines a Java UDF instance of Columns as user-defined function (UDF).
@@ -192,7 +192,7 @@ class FunctionsImpl extends Functions {
    * API `UserDefinedFunction.asNondeterministic()`.
    */
   override def df_udf(f: UDF8[Column, Column, Column, Column, Column, Column,
-    Column, Column, Column]): UserDefinedFunction = sp_udf(JDFUDF8(f), LongType)
+    Column, Column, Column]): UserDefinedFunction = sp_udf(new JDFUDF8(f), LongType)
 
   /**
    * Defines a Java UDF instance of Columns as user-defined function (UDF).
@@ -200,7 +200,7 @@ class FunctionsImpl extends Functions {
    * API `UserDefinedFunction.asNondeterministic()`.
    */
   override def df_udf(f: UDF9[Column, Column, Column, Column, Column, Column,
-    Column, Column, Column, Column]): UserDefinedFunction = sp_udf(JDFUDF9(f), LongType)
+    Column, Column, Column, Column]): UserDefinedFunction = sp_udf(new JDFUDF9(f), LongType)
 
   /**
    * Defines a Java UDF instance of Columns as user-defined function (UDF).
@@ -208,5 +208,6 @@ class FunctionsImpl extends Functions {
    * API `UserDefinedFunction.asNondeterministic()`.
    */
   override def df_udf(f: UDF10[Column, Column, Column, Column, Column, Column,
-    Column, Column, Column, Column, Column]): UserDefinedFunction = sp_udf(JDFUDF10(f), LongType)
+    Column, Column, Column, Column, Column]): UserDefinedFunction =
+    sp_udf(new JDFUDF10(f), LongType)
 }
\ No newline at end of file
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/AbstractGpuJoinIterator.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/AbstractGpuJoinIterator.scala
index 35ff58d81d9..5eb4d3bfcd5 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/AbstractGpuJoinIterator.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/AbstractGpuJoinIterator.scala
@@ -23,7 +23,6 @@ import com.nvidia.spark.rapids.RmmRapidsRetryIterator.{splitTargetSizeInHalfGpu,
 import com.nvidia.spark.rapids.ScalableTaskCompletion.onTaskCompletion
 
 import org.apache.spark.TaskContext
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.catalyst.expressions.Attribute
 import org.apache.spark.sql.catalyst.plans.{InnerLike, JoinType, LeftOuter, RightOuter}
 import org.apache.spark.sql.rapids.execution.GatherMapsResult
@@ -148,7 +147,7 @@ abstract class AbstractGpuJoinIterator(
         // less from the gatherer, but because the gatherer tracks how much is used, the
         // next call to this function will start in the right place.
         val estimatedDataSize = (gather.numRowsLeft * gather.realCheapPerRowSizeEstimate).toLong
-        val targetSizeWrapper = AutoCloseableTargetSize(targetSize, minTargetSize,
+        val targetSizeWrapper = new AutoCloseableTargetSize(targetSize, minTargetSize,
           estimatedDataSize)
         gather.checkpoint()
         withRetry(targetSizeWrapper, splitTargetSizeInHalfGpu) { attempt =>
@@ -199,7 +198,7 @@ abstract class SplittableJoinIterator(
       targetSize,
       sizeEstimateThreshold,
       opTime = opTime,
-      joinTime = joinTime) with Logging {
+      joinTime = joinTime) with RapidsLocalLog {
   // For some join types even if there is no stream data we might output something
   private var isInitialJoin = true
   // If the join explodes this holds batches from the stream side split into smaller pieces.
@@ -364,7 +363,7 @@ abstract class SplittableJoinIterator(
         case None if joinType == RightOuter && rightData.numCols > 0 =>
           // Distinct right outer joins only produce a single gather map since right table rows
           // are not rearranged by the join.
-          MultiJoinGather(leftGatherer, new JoinGathererSameTable(rightData))
+          new MultiJoinGather(leftGatherer, new JoinGathererSameTable(rightData))
         case None =>
           // When there isn't a `rightMap` we are in either LeftSemi or LeftAnti joins.
           // In these cases, the map and the table are both the left side, and everything in the map
@@ -383,7 +382,7 @@ abstract class SplittableJoinIterator(
           }
           val lazyRightMap = LazySpillableGatherMap(right, "right_map")
           val rightGatherer = JoinGatherer(lazyRightMap, rightData, rightOutOfBoundsPolicy)
-          MultiJoinGather(leftGatherer, rightGatherer)
+          new MultiJoinGather(leftGatherer, rightGatherer)
       }
       if (gatherer.isDone) {
         // Nothing matched...
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/AbstractHostByteBufferIterator.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/AbstractHostByteBufferIterator.scala
deleted file mode 100644
index 24f3bacf28b..00000000000
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/AbstractHostByteBufferIterator.scala
+++ /dev/null
@@ -1,103 +0,0 @@
-/*
- * Copyright (c) 2023, NVIDIA CORPORATION.
- *
- * Licensed under the Apache License, Version 2.0 (the "License");
- * you may not use this file except in compliance with the License.
- * You may obtain a copy of the License at
- *
- *     http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-
-package com.nvidia.spark.rapids
-
-import java.nio.ByteBuffer
-
-import ai.rapids.cudf.{Cuda, HostMemoryBuffer, MemoryBuffer}
-
-abstract class AbstractHostByteBufferIterator
-    extends Iterator[ByteBuffer] {
-  private[this] var nextBufferStart: Long = 0L
-
-  val totalLength: Long
-
-  protected val limit: Long = Integer.MAX_VALUE
-
-  def getByteBuffer(offset: Long, length: Long): ByteBuffer
-
-  override def hasNext: Boolean = nextBufferStart < totalLength
-
-  override def next(): ByteBuffer = {
-    val offset = nextBufferStart
-    val length = Math.min(totalLength - nextBufferStart, limit)
-    nextBufferStart += length
-    getByteBuffer(offset, length)
-  }
-}
-
-/**
- * Create an iterator that will emit ByteBuffer instances sequentially
- * to work around the 2GB ByteBuffer size limitation. This allows
- * the entire address range of a >2GB host buffer to be covered
- * by a sequence of ByteBuffer instances.
- * <p>NOTE: It is the caller's responsibility to ensure this iterator
- * does not outlive the host buffer. The iterator DOES NOT increment
- * the reference count of the host buffer to ensure it remains valid.
- *
- * @param hostBuffer host buffer to iterate
- * @return ByteBuffer iterator
- */
-class HostByteBufferIterator(hostBuffer: HostMemoryBuffer)
-    extends AbstractHostByteBufferIterator {
-  override protected val limit: Long = Integer.MAX_VALUE
-
-  override val totalLength: Long = if (hostBuffer == null) {
-    0
-  } else {
-    hostBuffer.getLength
-  }
-
-  override def getByteBuffer(offset: Long, length: Long): ByteBuffer = {
-    hostBuffer.asByteBuffer(offset, length.toInt)
-  }
-}
-
-/**
- * Create an iterator that will emit ByteBuffer instances sequentially
- * to work around the 2GB ByteBuffer size limitation after copying a `MemoryBuffer`
- * (which is likely a `DeviceMemoryBuffer`) to a host-backed bounce buffer
- * that is likely smaller than 2GB.
- * @note It is the caller's responsibility to ensure this iterator
- *   does not outlive `memoryBuffer`. The iterator DOES NOT increment
- *   the reference count of `memoryBuffer` to ensure it remains valid.
- * @param memoryBuffer memory buffer to copy. This is likely a DeviceMemoryBuffer
- * @param bounceBuffer a host bounce buffer that will be used to stage copies onto the host
- * @param stream stream to synchronize on after staging to bounceBuffer
- * @return ByteBuffer iterator
- */
-class MemoryBufferToHostByteBufferIterator(
-    memoryBuffer: MemoryBuffer,
-    bounceBuffer: HostMemoryBuffer,
-    stream: Cuda.Stream)
-    extends AbstractHostByteBufferIterator {
-  override val totalLength: Long = if (memoryBuffer == null) {
-    0
-  } else {
-    memoryBuffer.getLength
-  }
-
-  override protected val limit: Long =
-    Math.min(bounceBuffer.getLength, Integer.MAX_VALUE)
-
-  override def getByteBuffer(offset: Long, length: Long): ByteBuffer = {
-    bounceBuffer
-      .copyFromMemoryBufferAsync(0, memoryBuffer, offset, length, stream)
-    stream.sync()
-    bounceBuffer.asByteBuffer(0, length.toInt)
-  }
-}
\ No newline at end of file
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/AllocationRetryCoverageTracker.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/AllocationRetryCoverageTracker.scala
index 937ac453672..3c3359682ba 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/AllocationRetryCoverageTracker.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/AllocationRetryCoverageTracker.scala
@@ -23,7 +23,6 @@ import java.util.regex.Pattern
 
 import com.nvidia.spark.rapids.Arm.withResource
 
-import org.apache.spark.internal.Logging
 
 /**
  * Memory allocation kind for retry coverage tracking.
@@ -62,7 +61,17 @@ object AllocationKind extends Enumeration {
  * 
  * See: https://github.com/NVIDIA/spark-rapids/issues/13672
  */
-object AllocationRetryCoverageTracker extends Logging {
+object AllocationRetryCoverageTracker {
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+
+  // Forces the by-name message only when WARN is enabled, matching Spark's Logging.logWarning.
+  private def logWarning(msg: => String): Unit =
+    if (log.isWarnEnabled) log.warn(msg)
+
+  // Forces the by-name message only when ERROR is enabled, matching Spark's Logging.logError.
+  private def logError(msg: => String, throwable: Throwable): Unit =
+    if (log.isErrorEnabled) log.error(msg, throwable)
+
   import AllocationKind._
 
   // Environment variable to enable retry coverage tracking (debug-only).
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/ArrayIndexUtils.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/ArrayIndexUtils.scala
deleted file mode 100644
index c4c2bd3acb4..00000000000
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/ArrayIndexUtils.scala
+++ /dev/null
@@ -1,53 +0,0 @@
-/*
- * Copyright (c) 2022-2023, NVIDIA CORPORATION.
- *
- * Licensed under the Apache License, Version 2.0 (the "License");
- * you may not use this file except in compliance with the License.
- * You may obtain a copy of the License at
- *
- *     http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-
-package com.nvidia.spark.rapids
-
-import ai.rapids.cudf.{ColumnVector, ColumnView, Table}
-import com.nvidia.spark.rapids.Arm.withResource
-
-object ArrayIndexUtils {
-
-  /**
-   * Return the first int value (should be valid) in 'indices' and 'numElements' as a pair
-   * where the corresponding row in 'mask' is true. Null rows in mask are skipped.
-   *
-   * Both 'indices' and 'numElements' should be column of int, and have the same row number.
-   * 'mask' should be a boolean column, and have the same row number with 'indices'.
-   * Otherwise, the behavior is undefined.
-   *
-   * This is made for outputting more details for invalid index error in GpuElementAt and
-   * GpuGetArrayItem. So the caller should take care of the limitations.
-   */
-  def firstIndexAndNumElementUnchecked(mask: ColumnView, indices: ColumnVector,
-      numElements: ColumnVector): (Int, Int) = {
-    val filteredTable = withResource(new Table(indices, numElements)) { indexTable =>
-      indexTable.filter(mask)
-    }
-    withResource(filteredTable) { _ =>
-      assert(filteredTable.getRowCount > 0)
-      val index = withResource(filteredTable.getColumn(0).copyToHost()) { indicesH =>
-        assert(!indicesH.isNull(0))
-        indicesH.getInt(0)
-      }
-      val numElement = withResource(filteredTable.getColumn(1).copyToHost()) { numElemsH =>
-        assert(!numElemsH.isNull(0))
-        numElemsH.getInt(0)
-      }
-      (index, numElement)
-    }
-  }
-}
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/ArrayUtils.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/ArrayUtils.scala
index b353aa4f126..05a32a16a37 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/ArrayUtils.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/ArrayUtils.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2025-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2025-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -19,7 +19,7 @@ package com.nvidia.spark.rapids
 import org.apache.spark.sql.catalyst.expressions.{ArrayDistinct, Expression}
 import org.apache.spark.sql.rapids.GpuArrayDistinct
 
-case class GpuArrayDistinctMeta(
+class GpuArrayDistinctMeta(
   expr: ArrayDistinct,
   override val conf: RapidsConf,
   parentMetaOpt: Option[RapidsMeta[_, _, _]],
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/AstUtil.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/AstUtil.scala
index f2ce4d8a39f..90f935ac57b 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/AstUtil.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/AstUtil.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2023, NVIDIA CORPORATION.
+ * Copyright (c) 2023-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -110,7 +110,7 @@ object AstUtil {
       val gpuExpr = expr.convertToGpu()
       
       // Check if we've already processed this expression (for deduplication)
-      processed.get(GpuExpressionEquals(gpuExpr)) match {
+      processed.get(new GpuExpressionEquals(gpuExpr)) match {
         case Some(replacement) => 
           replacement
         case None =>
@@ -135,7 +135,7 @@ object AstUtil {
           // Create an AttributeReference explicitly to avoid issues with unresolved aliases
           val attributeRef = AttributeReference(alias.name, gpuExpr.dataType, 
             gpuExpr.nullable, alias.metadata)(alias.exprId, alias.qualifier)
-          processed.put(GpuExpressionEquals(gpuExpr), attributeRef)
+          processed.put(new GpuExpressionEquals(gpuExpr), attributeRef)
           attributeRef
       }
     } else {
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/AvroDataFileReader.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/AvroDataFileReader.scala
index aaecf016871..bbc8f2a5dfd 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/AvroDataFileReader.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/AvroDataFileReader.scala
@@ -33,7 +33,7 @@ import org.apache.commons.io.output.CountingOutputStream
 import org.apache.hadoop.conf.Configuration
 import org.apache.hadoop.fs.Path
 
-import org.apache.spark.sql.rapids.shims.TrampolineConnectShims
+import org.apache.spark.sql.rapids.execution.TrampolineUtil
 
 private[rapids] class AvroSeekableInputStream(in: SeekableInput) extends InputStream
     with SeekableInput {
@@ -82,7 +82,7 @@ case class Header(
   @transient
   lazy val schema: Schema = {
     getMetaString(SCHEMA)
-      .map(s => TrampolineConnectShims.createSchemaParser().parse(s))
+      .map(s => TrampolineUtil.createSchemaParser().parse(s))
       .orNull
   }
 
@@ -127,26 +127,6 @@ object Header {
   }
 }
 
-/**
- * The each Avro block information
- *
- * @param blockStart the start of block
- * @param blockSize  the whole block size = the size between two sync buffers + sync buffer
- * @param dataSize   the block data size
- * @param count      how many entries in this block
- */
-case class BlockInfo(blockStart: Long, blockSize: Long, dataSize: Long, count: Long)
-
-/**
- * The mutable version of the BlockInfo without block start.
- * This is for reusing an existing instance when accessing data in the iterator pattern.
- *
- * @param blockSize the whole block size (the size between two sync buffers + sync buffer size)
- * @param dataSize  the data size in this block
- * @param count   how many entries in this block
- */
-case class MutableBlockInfo(var blockSize: Long, var dataSize: Long, var count: Long)
-
 /** The parent of the Rapids Avro file readers */
 abstract class AvroFileReader(si: SeekableInput) extends AutoCloseable {
   // Children should update this pointer accordingly.
@@ -328,7 +308,7 @@ class AvroMetaFileReader(si: SeekableInput) extends AvroFileReader(si) {
       val dataSizeLongLen = BinaryData.encodeLong(blockDataSize, buf, 0)
       // (len of entries) + (len of block size) + (block size) + (sync size)
       val blockLength = countLongLen + dataSizeLongLen + blockDataSize + SYNC_SIZE
-      blocks += BlockInfo(curBlockStart, blockLength, blockDataSize, blockCount)
+      blocks += new BlockInfo(curBlockStart, blockLength, blockDataSize, blockCount)
 
       // Do we need to check the SYNC BUFFER, or just let cudf do it?
       curBlockStart += blockLength
@@ -405,11 +385,11 @@ class AvroDataFileReader(si: SeekableInput) extends AvroFileReader(si) {
       throw new NoSuchElementException
     }
     if (reuse == null) {
-      MutableBlockInfo(curBlockSize, curDataSize, curCount)
+      new MutableBlockInfo(curBlockSize, curDataSize, curCount)
     } else {
-      reuse.blockSize = curBlockSize
-      reuse.dataSize = curDataSize
-      reuse.count = curCount
+      reuse.setBlockSize(curBlockSize)
+      reuse.setDataSize(curDataSize)
+      reuse.setCount(curCount)
       reuse
     }
   }
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/BatchWithPartitionData.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/BatchWithPartitionData.scala
index d0f61d884d7..8d52586bcd7 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/BatchWithPartitionData.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/BatchWithPartitionData.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2023-2024, NVIDIA CORPORATION.
+ * Copyright (c) 2023-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -28,28 +28,6 @@ import org.apache.spark.sql.catalyst.InternalRow
 import org.apache.spark.sql.types.{StringType, StructType}
 import org.apache.spark.sql.vectorized.ColumnarBatch
 
-/**
- * Wrapper class that specifies how many rows to replicate
- * the partition value.
- */
-case class PartitionRowData(rowValue: InternalRow, rowNum: Int)
-
-object PartitionRowData {
-  def from(rowValues: Array[InternalRow], rowNums: Array[Int]): Array[PartitionRowData] = {
-    rowValues.zip(rowNums).map {
-      case (rowValue, rowNum) => PartitionRowData(rowValue, rowNum)
-    }
-  }
-
-  def from(rowValues: Array[InternalRow], rowNums: Array[Long]): Array[PartitionRowData] = {
-    rowValues.zip(rowNums).map {
-      case (rowValue, rowNum) =>
-        require(rowNum <= Integer.MAX_VALUE, s"Row number $rowNum exceeds max value of an integer.")
-        PartitionRowData(rowValue, rowNum.toInt)
-    }
-  }
-}
-
 /**
  * Class to wrap columnar batch and partition rows data and utility functions to merge them.
  *
@@ -59,10 +37,10 @@ object PartitionRowData {
  *                             rows to replicate the partition value.
  * @param partitionSchema      Schema of the partitioned data.
  */
-case class BatchWithPartitionData(
-    inputBatch: SpillableColumnarBatch,
-    partitionedRowsData: Array[PartitionRowData],
-    partitionSchema: StructType) extends AutoCloseable {
+class BatchWithPartitionData(
+    val inputBatch: SpillableColumnarBatch,
+    val partitionedRowsData: Array[PartitionRowData],
+    val partitionSchema: StructType) extends AutoCloseable {
 
   /**
    * Merges the partitioned data with the input ColumnarBatch.
@@ -98,7 +76,9 @@ case class BatchWithPartitionData(
         val dataType = field.dataType
         // Create an array to hold the individual columns for each partition.
         val singlePartCols = partitionedRowsData.safeMap {
-          case PartitionRowData(valueRow, rowNum) =>
+          partitionRowData =>
+            val valueRow = partitionRowData.rowValue
+            val rowNum = partitionRowData.rowNum
             val singleValue = valueRow.get(colIndex, dataType)
             withResource(GpuScalar.from(singleValue, dataType)) { singleScalar =>
               // Create a column vector from the GPU scalar, associated with the row number.
@@ -272,14 +252,14 @@ object BatchWithPartitionDataUtils {
       // Splitting occurs if for any column, maximum rows we can fit is less than rows in partition.
       splitOccurred = maxRows < rowsInPartition
       if (splitOccurred) {
-        currentBatch.append(PartitionRowData(valuesInPartition, maxRows))
+        currentBatch.append(new PartitionRowData(valuesInPartition, maxRows))
         resultBatches.append(currentBatch.toArray)
         currentBatch.clear()
         java.util.Arrays.fill(sizeOfBatch, 0)
         rowsInPartition -= maxRows
       } else {
         // If there was no split, all rows can fit in current batch.
-        currentBatch.append(PartitionRowData(valuesInPartition, rowsInPartition))
+        currentBatch.append(new PartitionRowData(valuesInPartition, rowsInPartition))
         val partitionSizes = calculatePartitionSizes(rowsInPartition, valuesInPartition, partSchema)
         sizeOfBatch.indices.foreach(i => sizeOfBatch(i) += partitionSizes(i))
       }
@@ -364,7 +344,7 @@ object BatchWithPartitionDataUtils {
       // Combine the split GPU ColumnVectors with partition ColumnVectors.
       splitColumnarBatches.zip(listOfPartitionedRowsData).map {
         case (spillableBatch, partitionedRowsData) =>
-          BatchWithPartitionData(spillableBatch, partitionedRowsData, partitionSchema)
+          new BatchWithPartitionData(spillableBatch, partitionedRowsData, partitionSchema)
       }
     }
   }
@@ -397,9 +377,7 @@ object BatchWithPartitionDataUtils {
       listOfPartitionedRowsData: Array[Array[PartitionRowData]]): Seq[Int] = {
     // Calculate the row counts for each batch
     val rowCountsForEachBatch = listOfPartitionedRowsData.map(partitionData =>
-      partitionData.map {
-        case PartitionRowData(_, rowNum) => rowNum
-      }.sum
+      partitionData.map(_.rowNum).sum
     )
     // Calculate split indices using cumulative sum
     rowCountsForEachBatch.scanLeft(0)(_ + _).drop(1).dropRight(1)
@@ -479,13 +457,13 @@ object BatchWithPartitionDataUtils {
         if (remainingRows > 0) {
           // Add rows to the left partition, up to the remaining rows available
           val rowsToAddToLeft = Math.min(partitionRow.rowNum, remainingRows)
-          leftHalf += partitionRow.copy(rowNum = rowsToAddToLeft)
+          leftHalf += new PartitionRowData(partitionRow.rowValue, rowsToAddToLeft)
           rowsAddedToLeft += rowsToAddToLeft
           remainingRows -= rowsToAddToLeft
           if (remainingRows <= 0) {
             // Add remaining rows to the right partition
             val rowsToAddToRight = partitionRow.rowNum - rowsToAddToLeft
-            rightHalf += partitionRow.copy(rowNum = rowsToAddToRight)
+            rightHalf += new PartitionRowData(partitionRow.rowValue, rowsToAddToRight)
             rowsAddedToRight += rowsToAddToRight
           }
         } else {
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/BoolUtils.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/BoolUtils.scala
deleted file mode 100644
index 35283e01119..00000000000
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/BoolUtils.scala
+++ /dev/null
@@ -1,62 +0,0 @@
-/*
- * Copyright (c) 2022-2023, NVIDIA CORPORATION.
- *
- * Licensed under the Apache License, Version 2.0 (the "License");
- * you may not use this file except in compliance with the License.
- * You may obtain a copy of the License at
- *
- *     http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-
-package com.nvidia.spark.rapids
-
-import ai.rapids.cudf.{ColumnVector, DType}
-import com.nvidia.spark.rapids.Arm.withResource
-
-object BoolUtils {
-
-  /**
-   * Whether all the valid rows in 'col' are true. An empty column will get true.
-   * null rows are skipped.
-   */
-  def isAllValidTrue(col: ColumnVector): Boolean = {
-    assert(DType.BOOL8 == col.getType, "input column type is not bool")
-    if (col.getRowCount == 0) {
-      return true
-    }
-
-    if (col.getRowCount == col.getNullCount) {
-      // all is null, equal to empty, since nulls should be skipped.
-      return true
-    }
-    withResource(col.all()) { allTrue =>
-      // Guaranteed there is at least one row and not all of the rows are null,
-      // so result scalar must be valid
-      allTrue.getBoolean
-    }
-  }
-
-  /**
-   * Whether there is any valid row in 'col' and it is true. An empty column will get false.
-   * null rows are skipped.
-   */
-  def isAnyValidTrue(col: ColumnVector): Boolean = {
-    assert(DType.BOOL8 == col.getType, "input column type is not bool")
-
-    if (col.getRowCount == col.getNullCount) {
-      // all is null, return false since nulls should be skipped.
-      return false
-    }
-    withResource(col.any()) { anyTrue =>
-      // Guaranteed there is at least one row and not all of the rows are null,
-      // so result scalar must be valid
-      anyTrue.getBoolean
-    }
-  }
-}
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/BucketJoinTwoSidesPrefetch.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/BucketJoinTwoSidesPrefetch.scala
index a7acd9a1172..ae14942d66f 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/BucketJoinTwoSidesPrefetch.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/BucketJoinTwoSidesPrefetch.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2025, NVIDIA CORPORATION.
+ * Copyright (c) 2025-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -15,7 +15,6 @@
  */
 package com.nvidia.spark.rapids
 
-import org.apache.spark.sql.catalyst.rules.Rule
 import org.apache.spark.sql.execution.SparkPlan
 import org.apache.spark.sql.execution.exchange.Exchange
 import org.apache.spark.sql.rapids.GpuFileSourceScanExec
@@ -28,7 +27,7 @@ import org.apache.spark.sql.rapids.GpuFileSourceScanExec
  *
  * NOTE: This is postShimPlanRule which should be applied after GpuOverrides.
  */
-object BucketJoinTwoSidesPrefetch extends Rule[SparkPlan] {
+object BucketJoinTwoSidesPrefetch {
 
   // Traverse through the plan tree and enable IO prefetch for all GpuFileSourceScanExec
   // which are directly connected to this join node without any shuffle.
@@ -44,7 +43,7 @@ object BucketJoinTwoSidesPrefetch extends Rule[SparkPlan] {
     }
   }
 
-  override def apply(plan: SparkPlan): SparkPlan = {
+  def apply(plan: SparkPlan): SparkPlan = {
     // Enable IO prefetch by a mutable operation on target nodes instead of re-generating
     // the plan tree. By doing so, it saves a lot of trouble.
     if (RapidsConf.BUCKET_JOIN_IO_PREFETCH.get(plan.conf)) {
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/ColumnarOutputWriter.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/ColumnarOutputWriter.scala
index feacd649a2e..8c72b7f9bea 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/ColumnarOutputWriter.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/ColumnarOutputWriter.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2019-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2019-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -32,7 +32,6 @@ import org.apache.hadoop.fs.Path
 import org.apache.hadoop.mapreduce.TaskAttemptContext
 
 import org.apache.spark.TaskContext
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.rapids.{ColumnarWriteTaskStatsTracker, GpuWriteTaskStatsTracker}
 import org.apache.spark.sql.types.StructType
 import org.apache.spark.sql.vectorized.ColumnarBatch
@@ -81,7 +80,23 @@ abstract class ColumnarOutputWriter(context: TaskAttemptContext,
     debugDumpPath: Option[String],
     holdGpuBetweenBatches: Boolean = false,
     useAsyncWrite: Boolean = false,
-    rapidsFileIO: RapidsFileIO) extends HostBufferConsumer with Logging {
+    rapidsFileIO: RapidsFileIO) extends HostBufferConsumer {
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+
+  /**
+   * Logs `msg` at DEBUG. The by-name `msg` is evaluated only when DEBUG is enabled.
+   */
+  private def logDebug(msg: => String): Unit =
+    if (log.isDebugEnabled) log.debug(msg)
+
+  // Evaluate the by-name `msg` only when WARN is enabled.
+  private def logWarning(msg: => String): Unit =
+    if (log.isWarnEnabled) log.warn(msg)
+
+  // Evaluate the by-name `msg` only when ERROR is enabled.
+  private def logError(msg: => String, throwable: Throwable): Unit =
+    if (log.isErrorEnabled) log.error(msg, throwable)
+
 
   // Length of the file written so far. This is used to track the size of the file
   private var fileLength: Long = 0L
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/CopyCompressionCodec.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/CopyCompressionCodec.scala
index e2e86495b16..e2d0409c68b 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/CopyCompressionCodec.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/CopyCompressionCodec.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2020-2023, NVIDIA CORPORATION.
+ * Copyright (c) 2020-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -51,7 +51,7 @@ class BatchedCopyCompressor(maxBatchMemory: Long, stream: Cuda.Stream)
           ct,
           CodecType.COPY,
           outBuffer.getLength)
-        CompressedTable(outBuffer.getLength, meta, outBuffer)
+        new CompressedTable(outBuffer.getLength, meta, outBuffer)
       }
     }
     closeOnExcept(result) { _ => stream.sync() }
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/CostBasedOptimizer.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/CostBasedOptimizer.scala
index cb79e329e7a..a9e248c72d9 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/CostBasedOptimizer.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/CostBasedOptimizer.scala
@@ -20,7 +20,6 @@ import scala.collection.mutable.ListBuffer
 
 import com.nvidia.spark.rapids.shims.{GlobalLimitShims, QueryStageRowCountShims, SparkShimImpl}
 
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.catalyst.expressions.{Alias, AttributeReference, Expression, GetStructField, WindowFrame, WindowSpecDefinition}
 import org.apache.spark.sql.catalyst.plans.{JoinType, LeftAnti, LeftSemi}
 import org.apache.spark.sql.execution.{GlobalLimitExec, LocalLimitExec, SparkPlan, TakeOrderedAndProjectExec, UnionExec}
@@ -51,7 +50,13 @@ trait Optimizer {
  * data to the GPU just for a trivial projection and then have to move data back to the CPU on the
  * next step.
  */
-class CostBasedOptimizer extends Optimizer with Logging {
+class CostBasedOptimizer extends Optimizer {
+
+  @transient private lazy val log = org.slf4j.LoggerFactory.getLogger(
+    classOf[CostBasedOptimizer])
+
+  private def logTrace(msg: => String): Unit =
+    if (log.isTraceEnabled) log.trace(msg)
 
   /**
    * Walk the plan and determine CPU and GPU costs for each operator and then make decisions
@@ -141,7 +146,7 @@ class CostBasedOptimizer extends Optimizer with Logging {
         // transition and reset the GPU cost
         if (operatorGpuCost + transitionCost > operatorCpuCost && !isExchangeOp(plan)) {
           // avoid transition and keep this operator on CPU
-          optimizations.append(AvoidTransition(plan))
+          optimizations.append(new AvoidTransition(plan))
           plan.costPreventsRunningOnGpu()
           // reset GPU cost
           totalGpuCost = totalCpuCost
@@ -163,7 +168,7 @@ class CostBasedOptimizer extends Optimizer with Logging {
             if (canRunOnGpu(child) && !isExchangeOp(child)
                 && childGpuTotal > childCpuCost) {
               // force this child plan back onto CPU
-              optimizations.append(ReplaceSection(
+              optimizations.append(new ReplaceSection(
                 child, totalCpuCost, totalGpuCost))
               child.recursiveCostPreventsRunningOnGpu()
             }
@@ -193,7 +198,7 @@ class CostBasedOptimizer extends Optimizer with Logging {
       if (canRunOnGpu(plan) && !isExchangeOp(plan)) {
         // this plan would have been on GPU so we move it and onto CPU and recurse down
         // until we reach a part of the plan that is already on CPU and then stop
-        optimizations.append(ReplaceSection(plan, totalCpuCost, totalGpuCost))
+        optimizations.append(new ReplaceSection(plan, totalCpuCost, totalGpuCost))
         plan.recursiveCostPreventsRunningOnGpu()
         // reset the costs because this section of the plan was not moved to GPU
         totalGpuCost = totalCpuCost
@@ -492,15 +497,15 @@ object RowCountPlanVisitor {
 
 sealed abstract class Optimization
 
-case class AvoidTransition[INPUT <: SparkPlan](plan: SparkPlanMeta[INPUT]) extends Optimization {
+class AvoidTransition[INPUT <: SparkPlan](val plan: SparkPlanMeta[INPUT]) extends Optimization {
   override def toString: String = s"It is not worth moving to GPU for operator: " +
       s"${Explain.format(plan)}"
 }
 
-case class ReplaceSection[INPUT <: SparkPlan](
-    plan: SparkPlanMeta[INPUT],
-    totalCpuCost: Double,
-    totalGpuCost: Double) extends Optimization {
+class ReplaceSection[INPUT <: SparkPlan](
+    val plan: SparkPlanMeta[INPUT],
+    val totalCpuCost: Double,
+    val totalGpuCost: Double) extends Optimization {
   override def toString: String = s"It is not worth keeping this section on GPU; " +
       s"gpuCost=$totalGpuCost, cpuCost=$totalCpuCost:\n${Explain.format(plan)}"
 }
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/DateUtils.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/DateUtils.scala
index 795258dfe14..ae5e172c144 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/DateUtils.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/DateUtils.scala
@@ -16,13 +16,12 @@
 
 package com.nvidia.spark.rapids
 
-import java.time.LocalDate
+import java.time.{Instant, LocalDate}
 
 import scala.collection.mutable.ListBuffer
 
 import ai.rapids.cudf.{DType, Scalar}
 import com.nvidia.spark.rapids.VersionUtils.isSpark320OrLater
-import com.nvidia.spark.rapids.shims.DateTimeUtilsShims
 
 import org.apache.spark.sql.catalyst.util.DateTimeUtils.localDateToDays
 import org.apache.spark.sql.internal.SQLConf
@@ -53,6 +52,11 @@ object DateUtils {
 
   val ONE_SECOND_MICROSECONDS = 1000000
 
+  private def currentTimestampMicros: Long = { // Instant.now() as micros since the epoch
+    val instant = Instant.now()
+    instant.getEpochSecond * ONE_SECOND_MICROSECONDS + instant.getNano / 1000 // nanos -> micros
+  }
+
   val ONE_DAY_SECONDS = 86400L
 
   val ONE_DAY_MICROSECONDS = 86400000000L
@@ -80,7 +84,7 @@ object DateUtils {
     Map.empty
   } else {
     val today = currentDate()
-    val now = DateTimeUtilsShims.currentTimestamp
+    val now = currentTimestampMicros
     Map(
       EPOCH -> 0,
       NOW -> now / 1000000L,
@@ -94,7 +98,7 @@ object DateUtils {
     Map.empty
   } else {
     val today = currentDate()
-    val now = DateTimeUtilsShims.currentTimestamp
+    val now = currentTimestampMicros
     Map(
       EPOCH -> 0,
       NOW -> now,
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/DecimalUtil.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/DecimalUtil.scala
deleted file mode 100644
index 7538df81688..00000000000
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/DecimalUtil.scala
+++ /dev/null
@@ -1,60 +0,0 @@
-/*
- * Copyright (c) 2021-2023, NVIDIA CORPORATION.
- *
- * Licensed under the Apache License, Version 2.0 (the "License");
- * you may not use this file except in compliance with the License.
- * You may obtain a copy of the License at
- *
- *     http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-
-package com.nvidia.spark.rapids
-
-import ai.rapids.cudf
-import ai.rapids.cudf.{DecimalUtils, DType}
-
-import org.apache.spark.sql.types._
-
-object DecimalUtil {
-
-  def createCudfDecimal(dt: DecimalType): DType =
-    DecimalUtils.createDecimalType(dt.precision, dt.scale)
-
-  def outOfBounds(input: cudf.ColumnView, to: DecimalType): cudf.ColumnVector =
-    DecimalUtils.outOfBounds(input, to.precision, to.scale)
-
-  /**
-   * Return the size in bytes of the Fixed-width data types.
-   * WARNING: Do not use this method for variable-width data types
-   */
-  private[rapids] def getDataTypeSize(dt: DataType): Int = {
-    dt match {
-      case d: DecimalType if d.precision <= Decimal.MAX_INT_DIGITS => 4
-      case t => t.defaultSize
-    }
-  }
-
-  // The following types were copied from Spark's DecimalType class
-  private val BooleanDecimal = DecimalType(1, 0)
-
-  def optionallyAsDecimalType(t: DataType): Option[DecimalType] = t match {
-    case dt: DecimalType => Some(dt)
-    case ByteType | ShortType | IntegerType | LongType =>
-      Some(DecimalType(GpuColumnVector.getNonNestedRapidsType(t).getPrecisionForInt, 0))
-    case BooleanType => Some(BooleanDecimal)
-    case _ => None
-  }
-
-  def asDecimalType(t: DataType): DecimalType = optionallyAsDecimalType(t) match {
-    case Some(dt) => dt
-    case _ =>
-      throw new IllegalArgumentException(
-        s"Internal Error: type $t cannot automatically be cast to a supported DecimalType")
-  }
-}
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/DeviceMemoryEventHandler.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/DeviceMemoryEventHandler.scala
index f4723a7ff0f..f1a61d5d563 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/DeviceMemoryEventHandler.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/DeviceMemoryEventHandler.scala
@@ -24,7 +24,6 @@ import ai.rapids.cudf.{Cuda, Rmm, RmmEventHandler}
 import com.nvidia.spark.rapids.spill.SpillableDeviceStore
 import com.sun.management.HotSpotDiagnosticMXBean
 
-import org.apache.spark.internal.Logging
 
 /**
  * RMM event handler to trigger spilling from the device memory store.
@@ -36,7 +35,23 @@ import org.apache.spark.internal.Logging
 class DeviceMemoryEventHandler(
     store: SpillableDeviceStore,
     oomDumpDir: Option[String],
-    maxFailedOOMRetries: Int) extends RmmEventHandler with Logging {
+    maxFailedOOMRetries: Int) extends RmmEventHandler {
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+
+  /**
+   * Logs `msg` at INFO. The by-name `msg` is evaluated only when INFO is enabled.
+   */
+  private def logInfo(msg: => String): Unit =
+    if (log.isInfoEnabled) log.info(msg)
+
+  // Evaluate the by-name `msg` only when WARN is enabled.
+  private def logWarning(msg: => String): Unit =
+    if (log.isWarnEnabled) log.warn(msg)
+
+  // Evaluate the by-name `msg` only when ERROR is enabled.
+  private def logError(msg: => String, throwable: Throwable): Unit =
+    if (log.isErrorEnabled) log.error(msg, throwable)
+
 
   // Flag that ensures we dump stack traces once and not for every allocation
   // failure. The assumption is that unhandled allocations will be fatal
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/DumpUtils.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/DumpUtils.scala
index c59977cdab6..c5a1dad551a 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/DumpUtils.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/DumpUtils.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2021-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2021-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -28,10 +28,15 @@ import com.nvidia.spark.rapids.jni.kudo.KudoSerializer
 import org.apache.commons.io.IOUtils
 import org.apache.hadoop.conf.Configuration
 
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.vectorized.ColumnarBatch
 
-object DumpUtils extends Logging {
+object DumpUtils {
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+
+  // Evaluate the by-name `msg` only when WARN is enabled.
+  private def logWarning(msg: => String): Unit =
+    if (log.isWarnEnabled) log.warn(msg)
+
   /**
    * Debug utility to dump a host memory buffer to a file.
    *
@@ -51,7 +56,8 @@ object DumpUtils extends Logging {
       prefix: String,
       suffix: String): String = {
     try {
-      val (out, path) = FileUtils.createTempFile(conf, prefix, suffix)
+      val tempFile = FileUtils.createTempFile(conf, prefix, suffix)
+      val out = tempFile.getOutputStream
       withResource(out) { _ =>
         withResource(data.slice(offset, len)) { hmb =>
           withResource(new HostMemoryInputStream(hmb, hmb.getLength)) { in =>
@@ -59,7 +65,7 @@ object DumpUtils extends Logging {
           }
         }
       }
-      path.toString
+      tempFile.getPath.toString
     } catch {
       case e: Exception =>
         log.error(s"Error attempting to dump data", e)
@@ -73,7 +79,8 @@ object DumpUtils extends Logging {
       prefix: String,
       suffix: String): String = {
     try {
-      val (out, path) = FileUtils.createTempFile(conf, prefix, suffix)
+      val tempFile = FileUtils.createTempFile(conf, prefix, suffix)
+      val out = tempFile.getOutputStream
       withResource(out) { _ =>
         data.foreach { hmb =>
           withResource(new HostMemoryInputStream(hmb, hmb.getLength)) { in =>
@@ -81,7 +88,7 @@ object DumpUtils extends Logging {
           }
         }
       }
-      path.toString
+      tempFile.getPath.toString
     } catch {
       case e: Exception =>
         log.error(s"Error attempting to dump data", e)
@@ -324,7 +331,15 @@ private class ColumnIndex() {
   }
 }
 
-object ParquetDumper extends Logging {
+object ParquetDumper {
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+
+  private def logDebug(msg: => String): Unit = {
+    if (log.isDebugEnabled) {
+      log.debug(msg)
+    }
+  }
+
   val COMPRESS_TYPE = CompressionType.SNAPPY
 
   def parquetWriterOptionsFromTable[T <: NestedBuilder[_, _], V <: ColumnWriterOptions](
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/ExecutorCache.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/ExecutorCache.scala
deleted file mode 100644
index 4190d52c9ce..00000000000
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/ExecutorCache.scala
+++ /dev/null
@@ -1,51 +0,0 @@
-/*
- * Copyright (c) 2025, NVIDIA CORPORATION.
- *
- * Licensed under the Apache License, Version 2.0 (the "License");
- * you may not use this file except in compliance with the License.
- * You may obtain a copy of the License at
- *
- *     http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-
-package com.nvidia.spark.rapids
-
-import java.lang.management.ManagementFactory
-
-import ai.rapids.cudf.{Cuda, CudaComputeMode}
-
-/**
- * A singleton object to cache executor related information.
- * Uses lazy mode to ensure the values are only computed once per executor.
- */
-object ExecutorCache {
-
-  /**
-   * Cache the current device compute mode for current executor.
-   * It's based on the assumption that executor has been assigned to a single device,
-   * and will not change during the lifetime of the executor.
-   * Should be called on executor side.
-   */
-  private[rapids] lazy val getCurrentDeviceComputeMode: CudaComputeMode = Cuda.getComputeMode()
-
-  /**
-   * Cache the current device UUID for current executor.
-   * It's based on the assumption that executor has been assigned to a single device,
-   * and will not change during the lifetime of the executor.
-   * Should be called on executor side.
-   */
-  private[rapids] lazy val getCurrentDeviceUuid: Array[Byte] = Cuda.getGpuUuid()
-
-  /**
-   * Cache the current process name for current executor.
-   * Should be called on executor side.
-   */
-  private[rapids] lazy val getProcessName: String = ManagementFactory.getRuntimeMXBean.getName
-}
-
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/FileUtils.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/FileUtils.scala
deleted file mode 100644
index 5fe0f53d2d6..00000000000
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/FileUtils.scala
+++ /dev/null
@@ -1,46 +0,0 @@
-/*
- * Copyright (c) 2019, NVIDIA CORPORATION.
- *
- * Licensed under the Apache License, Version 2.0 (the "License");
- * you may not use this file except in compliance with the License.
- * You may obtain a copy of the License at
- *
- *     http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-
-package com.nvidia.spark.rapids
-
-import scala.util.Random
-
-import org.apache.hadoop.conf.Configuration
-import org.apache.hadoop.fs.{FileAlreadyExistsException, FSDataOutputStream, Path}
-
-object FileUtils {
-  def createTempFile(
-      conf: Configuration,
-      pathPrefix: String,
-      pathSuffix: String): (FSDataOutputStream, Path) = {
-    val fs = new Path(pathPrefix).getFileSystem(conf)
-    val rnd = new Random
-    var out: FSDataOutputStream = null
-    var path: Path = null
-    var succeeded = false
-    val suffix = if (pathSuffix != null) pathSuffix else ""
-    while (!succeeded) {
-      path = new Path(pathPrefix + rnd.nextInt(Integer.MAX_VALUE) + suffix)
-      if (!fs.exists(path)) {
-        scala.util.control.Exception.ignoring(classOf[FileAlreadyExistsException]) {
-          out = fs.create(path, false)
-          succeeded = true
-        }
-      }
-    }
-    (out, path)
-  }
-}
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/FloatUtils.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/FloatUtils.scala
deleted file mode 100644
index 69cad7cc77a..00000000000
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/FloatUtils.scala
+++ /dev/null
@@ -1,87 +0,0 @@
-/*
- * Copyright (c) 2020-2023, NVIDIA CORPORATION.
- *
- * Licensed under the Apache License, Version 2.0 (the "License");
- * you may not use this file except in compliance with the License.
- * You may obtain a copy of the License at
- *
- *     http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-
-package com.nvidia.spark.rapids
-
-import ai.rapids.cudf.{ColumnVector, ColumnView, DType, Scalar}
-import com.nvidia.spark.rapids.Arm.withResource
-
-object FloatUtils {
-
-  def nanToZero(cv: ColumnView): ColumnVector = {
-    if (cv.getType() != DType.FLOAT32 && cv.getType() != DType.FLOAT64) {
-      throw new IllegalArgumentException("Only Floats and Doubles allowed")
-    }
-    withResource(cv.isNan()) { isNan =>
-      withResource(
-        if (cv.getType == DType.FLOAT64) {
-          Scalar.fromDouble(0.0d)
-        } else {
-          Scalar.fromFloat(0.0f)
-        }
-      ) {
-        zero => isNan.ifElse(zero, cv)
-      }
-    }
-  }
-
-  def getNanScalar(dType: DType): Scalar = {
-    if (dType == DType.FLOAT64) {
-      Scalar.fromDouble(Double.NaN)
-    } else if (dType == DType.FLOAT32) {
-      Scalar.fromFloat(Float.NaN)
-    } else {
-      throw new IllegalArgumentException("NaNs are only supported for Float types")
-    }
-  }
-
-  def getPositiveInfinityScalar(dType: DType): Scalar = {
-    if (dType == DType.FLOAT64) {
-      Scalar.fromDouble(Double.PositiveInfinity)
-    } else {
-      Scalar.fromFloat(Float.PositiveInfinity)
-    }
-  }
-
-  def getNegativeInfinityScalar(dType: DType): Scalar = {
-    if (dType == DType.FLOAT64) {
-      Scalar.fromDouble(Double.NegativeInfinity)
-    } else {
-      Scalar.fromFloat(Float.NegativeInfinity)
-    }
-  }
-
-  def getInfinityVector(dtype: DType): ColumnVector = {
-    if (dtype == DType.FLOAT64) {
-      ColumnVector.fromDoubles(Double.PositiveInfinity, Double.NegativeInfinity)
-    } else {
-      ColumnVector.fromFloats(Float.PositiveInfinity, Float.NegativeInfinity)
-    }
-  }
-
-  def infinityToNulls(vec: ColumnVector): ColumnVector = {
-    def getNullVector: ColumnVector = {
-      if (vec.getType == DType.FLOAT64) ColumnVector.fromBoxedDoubles(null, null)
-      else ColumnVector.fromBoxedFloats(null, null)
-    }
-
-    withResource(getInfinityVector(vec.getType)) { infinityVector =>
-      withResource(getNullVector) { nullVector =>
-        vec.findAndReplaceAll(infinityVector, nullVector)
-      }
-    }
-  }
-}
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/FoldLocalAggregate.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/FoldLocalAggregate.scala
index 49600ee98f7..0a0359d7bbf 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/FoldLocalAggregate.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/FoldLocalAggregate.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2025, NVIDIA CORPORATION.
+ * Copyright (c) 2025-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -15,9 +15,7 @@
  */
 package com.nvidia.spark.rapids
 
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.catalyst.expressions.aggregate._
-import org.apache.spark.sql.catalyst.rules.Rule
 import org.apache.spark.sql.execution.SparkPlan
 import org.apache.spark.sql.execution.aggregate._
 
@@ -28,8 +26,16 @@ import org.apache.spark.sql.execution.aggregate._
  * redistribute data before final aggregate. The Local Aggregate may emerge under certain
  * circumstance, such as the BucketScan Spec fully matches the groupBy keys.
  */
-object FoldLocalAggregate extends Rule[SparkPlan] {
-  override def apply(plan: SparkPlan): SparkPlan = {
+object FoldLocalAggregate {
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+
+  private def logError(msg: => String): Unit = {
+    if (log.isErrorEnabled) {
+      log.error(msg)
+    }
+  }
+
+  def apply(plan: SparkPlan): SparkPlan = {
     plan.transform {
       case p@LocalAggregatePattern(finalAgg: BaseAggregateExec, partAgg: BaseAggregateExec) =>
         // Spark eliminates the filter for the aggExpressions in Final mode. So, we need to copy
@@ -84,7 +90,16 @@ object FoldLocalAggregate extends Rule[SparkPlan] {
  * The LocalAggregate can be emerged regardless HashAggregateExec, SortAggregateExec or
  * ObjectHashAggregateExec.
  */
-object LocalAggregatePattern extends Logging {
+object LocalAggregatePattern {
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+
+  private def logError(msg: => String): Unit = {
+    if (log.isErrorEnabled) {
+      log.error(msg)
+    }
+  }
+
+
   def unapply(plan: SparkPlan): Option[(BaseAggregateExec, BaseAggregateExec)] = {
     plan match {
       case hashAgg: HashAggregateExec
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuAggregateExec.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuAggregateExec.scala
index ae870049a45..0bb1e276aa6 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuAggregateExec.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuAggregateExec.scala
@@ -31,7 +31,6 @@ import com.nvidia.spark.rapids.ScalableTaskCompletion.onTaskCompletion
 import com.nvidia.spark.rapids.shims.AggregationTagging
 
 import org.apache.spark.TaskContext
-import org.apache.spark.internal.Logging
 import org.apache.spark.rdd.RDD
 import org.apache.spark.sql.catalyst.InternalRow
 import org.apache.spark.sql.catalyst.expressions.{Alias, Ascending, Attribute, AttributeReference, AttributeSeq, AttributeSet, Expression, ExprId, If, NamedExpression, SortOrder}
@@ -48,7 +47,15 @@ import org.apache.spark.sql.rapids.execution.{GpuBatchSubPartitioner, GpuShuffle
 import org.apache.spark.sql.types._
 import org.apache.spark.sql.vectorized.ColumnarBatch
 
-object AggregateUtils extends Logging {
+object AggregateUtils {
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+
+  private def logDebug(msg: => String): Unit = {
+    if (log.isDebugEnabled) {
+      log.debug(msg)
+    }
+  }
+
 
   private val aggs = List("min", "max", "avg", "sum", "count", "first", "last")
 
@@ -308,40 +315,20 @@ object AggregateUtils extends Logging {
 }
 
 /** Utility class to hold all of the metrics related to hash aggregation */
-case class GpuHashAggregateMetrics(
-    numOutputRows: GpuMetric,
-    numOutputBatches: GpuMetric,
-    numTasksRepartitioned: GpuMetric,
-    numTasksSkippedAgg: GpuMetric,
-    opTime: GpuMetric,
-    computeAggTime: GpuMetric,
-    concatTime: GpuMetric,
-    sortTime: GpuMetric,
-    repartitionTime: GpuMetric,
-    numAggOps: GpuMetric,
-    numPreSplits: GpuMetric,
-    singlePassTasks: GpuMetric,
-    heuristicTime: GpuMetric) {
-}
-
-/** Utility class to convey information on the aggregation modes being used */
-case class AggregateModeInfo(
-    uniqueModes: Seq[AggregateMode],
-    hasPartialMode: Boolean,
-    hasPartialMergeMode: Boolean,
-    hasFinalMode: Boolean,
-    hasCompleteMode: Boolean)
-
-object AggregateModeInfo {
-  def apply(uniqueModes: Seq[AggregateMode]): AggregateModeInfo = {
-    AggregateModeInfo(
-      uniqueModes = uniqueModes,
-      hasPartialMode = uniqueModes.contains(Partial),
-      hasPartialMergeMode = uniqueModes.contains(PartialMerge),
-      hasFinalMode = uniqueModes.contains(Final),
-      hasCompleteMode = uniqueModes.contains(Complete)
-    )
-  }
+class GpuHashAggregateMetrics(
+    val numOutputRows: GpuMetric,
+    val numOutputBatches: GpuMetric,
+    val numTasksRepartitioned: GpuMetric,
+    val numTasksSkippedAgg: GpuMetric,
+    val opTime: GpuMetric,
+    val computeAggTime: GpuMetric,
+    val concatTime: GpuMetric,
+    val sortTime: GpuMetric,
+    val repartitionTime: GpuMetric,
+    val numAggOps: GpuMetric,
+    val numPreSplits: GpuMetric,
+    val singlePassTasks: GpuMetric,
+    val heuristicTime: GpuMetric) extends Serializable {
 }
 
 /**
@@ -619,7 +606,8 @@ class AggHelper(
   }
 }
 
-object GpuAggregateIterator extends Logging {
+object GpuAggregateIterator {
+
   /**
    * @note abstracted away for a unit test..
    * @param helper
@@ -753,9 +741,9 @@ object GpuAggFirstPassIterator {
 //  * boundFinalProjections: on merged batches, finalize aggregates
 //     (GpuAverage => CudfSum/CudfCount)
 //  * boundResultReferences: project the result expressions Spark expects in the output.
-case class BoundExpressionsModeAggregates(
-    boundFinalProjections: Option[Seq[GpuExpression]],
-    boundResultReferences: Seq[Expression])
+class BoundExpressionsModeAggregates(
+    val boundFinalProjections: Option[Seq[GpuExpression]],
+    val boundResultReferences: Seq[Expression]) extends Serializable // as the case class was
 
 object GpuAggFinalPassIterator {
 
@@ -805,7 +793,7 @@ object GpuAggFinalPassIterator {
     } else {
       GpuBindReferences.bindGpuReferences(resultExpressions, groupingAttributes, metrics)
     }
-    BoundExpressionsModeAggregates(
+    new BoundExpressionsModeAggregates(
       boundFinalProjections,
       boundResultReferences)
   }
@@ -909,7 +897,7 @@ class GpuMergeAggregateIterator(
     localInputRowsCount: LocalGpuMetric,
     allMetrics: Map[String, GpuMetric]
 )
-  extends Iterator[ColumnarBatch] with AutoCloseable with Logging {
+  extends Iterator[ColumnarBatch] with AutoCloseable with RapidsLocalLog {
   private[this] val isReductionOnly = groupingExpressions.isEmpty
   private[this] val targetMergeBatchSize = computeTargetMergeBatchSize(configuredTargetBatchSize)
 
@@ -978,7 +966,7 @@ class GpuMergeAggregateIterator(
             s"$firstPassReductionRatioEstimate")
           // if so, skip any aggregation, return the origin batch directly
 
-          realIter = Some(ConcatIterator(firstPassIter, configuredTargetBatchSize))
+          realIter = Some(new ConcatIterator(firstPassIter, configuredTargetBatchSize))
           metrics.numTasksSkippedAgg += 1
           return realIter.get.next()
         } else {
@@ -1011,7 +999,7 @@ class GpuMergeAggregateIterator(
         metrics.numTasksRepartitioned += 1
       }
 
-      realIter = Some(ConcatIterator(
+      realIter = Some(new ConcatIterator(
         new CloseableBufferedIterator(buildBucketIterator()), configuredTargetBatchSize))
       realIter.get.next()
     }
@@ -1032,7 +1020,7 @@ class GpuMergeAggregateIterator(
     new AggHelper(inputAttributes, groupingExpressions, aggregateExpressions,
       forceMerge = true, conf, isSorted = false, allMetrics)
 
-  private case class ConcatIterator(
+  private class ConcatIterator(
       input: CloseableBufferedIterator[SpillableColumnarBatch],
       targetSize: Long)
     extends Iterator[ColumnarBatch] {
@@ -1061,7 +1049,7 @@ class GpuMergeAggregateIterator(
     }
   }
 
-  private case class RepartitionAggregateIterator(opTime: GpuMetric)
+  private class RepartitionAggregateIterator(opTime: GpuMetric)
     extends Iterator[SpillableColumnarBatch] {
 
     batchesByBucket = batchesByBucket.filter(_.size() > 0)
@@ -1098,7 +1086,7 @@ class GpuMergeAggregateIterator(
 
   /** Build an iterator merging aggregated batches in each bucket. */
   private def buildBucketIterator(): Iterator[SpillableColumnarBatch] = {
-    bucketIter = Some(RepartitionAggregateIterator(opTime = metrics.opTime))
+    bucketIter = Some(new RepartitionAggregateIterator(metrics.opTime))
     bucketIter.get
   }
 
@@ -1952,7 +1940,7 @@ case class GpuHashAggregateExec(
     allowSinglePassAgg: Boolean,
     allowNonFullyAggregatedOutput: Boolean,
     skipAggPassReductionRatio: Double
-) extends GpuPartitioningPreservingUnaryExecNode with GpuExec with Logging {
+) extends GpuPartitioningPreservingUnaryExecNode with GpuExec {
 
   // lifted directly from `BaseAggregateExec.inputAttributes`, edited comment.
   def inputAttributes: Seq[Attribute] =
@@ -1998,7 +1986,7 @@ case class GpuHashAggregateExec(
   }
 
   override def internalDoExecuteColumnar(): RDD[ColumnarBatch] = {
-    val aggMetrics = GpuHashAggregateMetrics(
+    val aggMetrics = new GpuHashAggregateMetrics(
       numOutputRows = gpuLongMetric(NUM_OUTPUT_ROWS),
       numOutputBatches = gpuLongMetric(NUM_OUTPUT_BATCHES),
       numTasksRepartitioned = gpuLongMetric(NUM_TASKS_REPARTITIONED),
@@ -2019,7 +2007,7 @@ case class GpuHashAggregateExec(
     val aggregateExprs = aggregateExpressions
     val aggregateAttrs = aggregateAttributes
     val resultExprs = resultExpressions
-    val modeInfo = AggregateModeInfo(uniqueModes)
+    val modeInfo = AggregateModeInfo.from(uniqueModes)
     val targetBatchSize = configuredTargetBatchSize
 
     val rdd = child.executeColumnar()
@@ -2213,7 +2201,7 @@ class DynamicGpuPartialAggregateIterator(
       inputIter
     } else {
       val sorter = new GpuSorter(ordering, inputAttrs, allMetrics)
-      GpuOutOfCoreSortIterator(inputIter,
+      new GpuOutOfCoreSortIterator(inputIter,
         sorter,
         configuredTargetBatchSize,
         opTime = metrics.opTime,
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuBoundAttribute.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuBoundAttribute.scala
index 3c5b9f26872..6f96496e8fd 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuBoundAttribute.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuBoundAttribute.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2019-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2019-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -19,7 +19,6 @@ package com.nvidia.spark.rapids
 import ai.rapids.cudf.ast
 import com.nvidia.spark.rapids.shims.ShimExpression
 
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.catalyst.expressions.{AttributeReference, AttributeSeq, Expression, ExprId, NamedExpression}
 import org.apache.spark.sql.internal.SQLConf
 import org.apache.spark.sql.rapids.catalyst.expressions.GpuEquivalentExpressions
@@ -40,7 +39,8 @@ trait GpuBind {
   def bind(input: AttributeSeq): GpuExpression
 }
 
-object GpuBindReferences extends Logging {
+object GpuBindReferences {
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
 
   /**
    * An alternative to `Expression.transformDown`, but when a result is returned by `rule` it is
@@ -161,8 +161,9 @@ object GpuBindReferences extends Logging {
         case (es: Seq[Expression], is: AttributeSeq) =>
           es.map(GpuBindReferences.bindGpuReferenceNoMetrics(_, is)).toList
       }
-      logTrace {
-        "INPUT:\n" +
+      if (log.isTraceEnabled) {
+        log.trace(
+          "INPUT:\n" +
           expressions.zipWithIndex.map {
             case (expr, idx) =>
               s"\t$idx:\t$expr"
@@ -175,11 +176,11 @@ object GpuBindReferences extends Logging {
                   case (expr, idx) =>
                     s"\t\t$idx:\t$expr"
                 }.mkString("\n")
-          }.mkString("\n")
+          }.mkString("\n"))
       }
-      GpuTieredProject(tiered)
+      new GpuTieredProject(tiered)
     } else {
-      GpuTieredProject(Seq(GpuBindReferences.bindGpuReferencesNoMetrics(expressions, input)))
+      new GpuTieredProject(Seq(GpuBindReferences.bindGpuReferencesNoMetrics(expressions, input)))
     }
   }
 
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuCSVScan.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuCSVScan.scala
index 75bd875743f..52c720650d3 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuCSVScan.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuCSVScan.scala
@@ -31,7 +31,6 @@ import org.apache.hadoop.conf.Configuration
 import org.apache.hadoop.fs.Path
 
 import org.apache.spark.broadcast.Broadcast
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.SparkSession
 import org.apache.spark.sql.catalyst.InternalRow
 import org.apache.spark.sql.catalyst.csv.{CSVOptions, GpuCsvUtils}
@@ -54,7 +53,15 @@ trait ScanWithMetrics {
   var metrics : Map[String, GpuMetric] = Map.empty
 }
 
-object GpuCSVScan extends Logging {
+object GpuCSVScan {
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+
+  private def logWarning(msg: => String): Unit = {
+    if (log.isWarnEnabled) {
+      log.warn(msg)
+    }
+  }
+
   private def tryLoadCharset(name: String): Option[Charset] = {
     try {
       Some(Charset.forName(name))
@@ -320,7 +327,7 @@ case class GpuCSVScan(
     val broadcastedConf = sparkSession.sparkContext.broadcast(
       new SerializableConfiguration(hadoopConf))
 
-    GpuCSVPartitionReaderFactory(sparkSession.sessionState.conf, broadcastedConf,
+    new GpuCSVPartitionReaderFactory(sparkSession.sessionState.conf, broadcastedConf,
       dataSchema, readDataSchema, readPartitionSchema, parsedOptions, maxReaderBatchSizeRows,
       maxReaderBatchSizeBytes, maxGpuColumnSizeBytes, metrics, options.asScala.toMap)
   }
@@ -344,7 +351,7 @@ case class GpuCSVScan(
   override def hashCode(): Int = super.hashCode()
 }
 
-case class GpuCSVPartitionReaderFactory(
+class GpuCSVPartitionReaderFactory(
     sqlConf: SQLConf,
     broadcastedConf: Broadcast[SerializableConfiguration],
     dataSchema: StructType,
@@ -356,7 +363,8 @@ case class GpuCSVPartitionReaderFactory(
     maxReaderBatchSizeBytes: Long,
     maxGpuColumnSizeBytes: Long,
     metrics: Map[String, GpuMetric],
-    @transient params: Map[String, String]) extends ShimFilePartitionReaderFactory(params) {
+    @transient params: Map[String, String])
+  extends ShimFilePartitionReaderFactory(params) with Serializable {
 
   override def buildReader(partitionedFile: PartitionedFile): PartitionReader[InternalRow] = {
     throw new IllegalStateException("ROW BASED PARSING IS NOT SUPPORTED ON THE GPU...")
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuCast.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuCast.scala
index 1328c3b7a1f..4847738b3da 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuCast.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuCast.scala
@@ -204,6 +204,9 @@ object CastOptions {
 
     override val useHexFormatForBinary: Boolean = true
   }
+
+  private def defaultNullifyOverflows: Boolean =
+    CastTimeToIntShim.ifNullifyOverflows
 }
 
 /**
@@ -223,7 +226,7 @@ class CastOptions(
     legacyCastComplexTypesToString: Boolean,
     ansiMode: Boolean,
     stringToDateAnsiMode: Boolean,
-    val nullifyOverflows: Boolean = CastTimeToIntShim.ifNullifyOverflows,
+    val nullifyOverflows: Boolean = CastOptions.defaultNullifyOverflows,
     val castToJsonString: Boolean = false,
     val ignoreNullFieldsInStructs: Boolean = true,
     val timeZoneId: Option[String] = Option.empty[String]) extends Serializable {
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuCoalesceBatches.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuCoalesceBatches.scala
index ffa84c5d5d7..bfced5eb03e 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuCoalesceBatches.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuCoalesceBatches.scala
@@ -27,7 +27,6 @@ import com.nvidia.spark.rapids.jni.GpuSplitAndRetryOOM
 import com.nvidia.spark.rapids.shims.{ShimExpression, ShimUnaryExecNode}
 
 import org.apache.spark.TaskContext
-import org.apache.spark.internal.Logging
 import org.apache.spark.rdd.RDD
 import org.apache.spark.sql.catalyst.InternalRow
 import org.apache.spark.sql.catalyst.expressions.{Attribute, Expression, SortOrder}
@@ -118,7 +117,7 @@ object CoalesceGoal {
         a // They are equal so it does not matter
       } else {
         // Nothing is the same so there is no guarantee
-        BatchedByKey(Seq.empty)(Seq.empty)
+        new BatchedByKey(Seq.empty)(Seq.empty)
       }
     case (TargetSize(aSize), TargetSize(bSize)) if aSize > bSize => a
     case _ => b
@@ -144,9 +143,9 @@ object CoalesceGoal {
     case (_, _: RequireSingleBatchLike) => false
     case (_: BatchedByKey, _: TargetSize) => true
     case (_: TargetSize, _: BatchedByKey) => false
-    case (BatchedByKey(aOrder), BatchedByKey(bOrder)) =>
-      aOrder.length == bOrder.length &&
-          aOrder.zip(bOrder).forall {
+    case (aGoal: BatchedByKey, bGoal: BatchedByKey) =>
+      aGoal.gpuOrder.length == bGoal.gpuOrder.length &&
+          aGoal.gpuOrder.zip(bGoal.gpuOrder).forall {
             case (a, b) => a.satisfies(b)
           }
     case (TargetSize(foundSize), TargetSize(requiredSize)) => foundSize >= requiredSize
@@ -236,10 +235,28 @@ case class TargetSize(override val targetSizeBytes: Long)
  * @param gpuOrder the GPU keys that should be used for batching.
  * @param cpuOrder the CPU keys that should be used for batching.
  */
-case class BatchedByKey(gpuOrder: Seq[SortOrder])(val cpuOrder: Seq[SortOrder])
-    extends CoalesceGoal {
+class BatchedByKey(val gpuOrder: Seq[SortOrder])(val cpuOrder: Seq[SortOrder])
+    extends CoalesceGoal with Serializable {
   require(gpuOrder.size == cpuOrder.size)
 
+  override def canEqual(that: Any): Boolean = that.isInstanceOf[BatchedByKey]
+
+  override def productArity: Int = 1
+
+  override def productElement(n: Int): Any = n match {
+    case 0 => gpuOrder
+    case _ => throw new IndexOutOfBoundsException(n.toString)
+  }
+
+  override def productPrefix: String = "BatchedByKey"
+
+  override def equals(other: Any): Boolean = other match {
+    case that: BatchedByKey => that.canEqual(this) && gpuOrder == that.gpuOrder
+    case _ => false
+  }
+
+  override def hashCode(): Int = scala.runtime.ScalaRunTime._hashCode(this)
+
   override def otherCopyArgs: Seq[AnyRef] = cpuOrder :: Nil
 
   override def children: Seq[Expression] = gpuOrder
@@ -267,7 +284,20 @@ abstract class AbstractGpuCoalesceIterator(
     streamTimeOrNoop: GpuMetric,
     concatTime: GpuMetric,
     opTime: GpuMetric,
-    opName: String) extends Iterator[ColumnarBatch] with Logging {
+    opName: String) extends Iterator[ColumnarBatch] {
+
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+
+  protected def logDebug(msg: => String): Unit = {
+    if (log.isDebugEnabled) {
+      log.debug(msg)
+    }
+  }
+
+  protected def logWarning(msg: => String): Unit = {
+    if (log.isWarnEnabled) log.warn(msg) // by-name msg is only built when WARN is on
+  }
+
 
   val streamTime = streamTimeOrNoop match {
     case NoopMetric => new LocalGpuMetric
@@ -507,7 +537,7 @@ abstract class AbstractGpuCoalesceIterator(
                 case RequireSingleBatchWithFilter(filterExpression) =>
                   if (inputFilterTier.isEmpty) {
                     // We are going to enter the null-filtering mode
-                    val filterTier = GpuTieredProject(Seq(Seq(filterExpression)))
+                    val filterTier = new GpuTieredProject(Seq(Seq(filterExpression)))
                     // 1) Filter what we had already stored, and the rows number should
                     //    be within the limit.
                     // Re-calculate the filtered rows number and size.
@@ -693,7 +723,7 @@ abstract class AbstractGpuCoalesceIterator(
           throw new GpuSplitAndRetryOOM(s"Cannot split a sequence of $numBatches batches")
         }
         val res = it.splitAt(numBatches / 2)
-        Seq(BatchesToCoalesce(res._1), BatchesToCoalesce(res._2))
+        Seq(new BatchesToCoalesce(res._1), new BatchesToCoalesce(res._2))
       }
     }
   }
@@ -706,7 +736,7 @@ abstract class AbstractGpuCoalesceIterator(
  * instances in `batches`
  * @param batches a sequence of `SpillableColumnarBatch` to manage.
  */
-case class BatchesToCoalesce(batches: Array[SpillableColumnarBatch])
+class BatchesToCoalesce(val batches: Array[SpillableColumnarBatch])
     extends AutoCloseable {
   override def close(): Unit = {
     batches.safeClose()
@@ -766,7 +796,7 @@ class GpuCoalesceIterator(iter: Iterator[ColumnarBatch],
   }
 
   override def getCoalesceRetryIterator: Iterator[ColumnarBatch] = {
-    val candidates = BatchesToCoalesce(batches.clone().toArray)
+    val candidates = new BatchesToCoalesce(batches.clone().toArray)
     batches.clear()
     withRetry(candidates, splitBatchesToCoalesceFn) { attempt: BatchesToCoalesce =>
       concatBatches(attempt.batches)
@@ -888,7 +918,7 @@ class GpuCompressionAwareCoalesceIterator(
   }
 
   override def getCoalesceRetryIterator: Iterator[ColumnarBatch] = {
-    val candidates = BatchesToCoalesce(batches.clone().toArray)
+    val candidates = new BatchesToCoalesce(batches.clone().toArray)
     batches.clear()
     withRetry(candidates, splitBatchesToCoalesceFn) { attempt: BatchesToCoalesce =>
       concatBatches(attempt.batches)
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuColumnarBatchSerializer.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuColumnarBatchSerializer.scala
index cfeebcdcede..6fb68704339 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuColumnarBatchSerializer.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuColumnarBatchSerializer.scala
@@ -694,7 +694,7 @@ object KudoSerializedTableColumn {
    * @return columnar batch to be passed to [[GpuShuffleCoalesceExec]]
    */
   def from(header: KudoTableHeader, hostBuffer: HostMemoryBuffer): ColumnarBatch = {
-    val kudoTable = SpillableKudoTable(header, hostBuffer)
+    val kudoTable = SpillableKudoTable.from(header, hostBuffer)
     val column = new KudoSerializedTableColumn(kudoTable)
     new ColumnarBatch(Array(column), kudoTable.header.getNumRows)
   }
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuCoreDumpHandler.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuCoreDumpHandler.scala
index 77c9a9987e8..0ade942599e 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuCoreDumpHandler.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuCoreDumpHandler.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2023, NVIDIA CORPORATION.
+ * Copyright (c) 2023-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -29,13 +29,32 @@ import org.apache.hadoop.fs.permission.{FsAction, FsPermission}
 
 import org.apache.spark.SparkContext
 import org.apache.spark.api.plugin.PluginContext
-import org.apache.spark.internal.Logging
 import org.apache.spark.io.CompressionCodec
 import org.apache.spark.sql.SparkSession
 import org.apache.spark.sql.rapids.execution.TrampolineUtil
 import org.apache.spark.util.SerializableConfiguration
 
-object GpuCoreDumpHandler extends Logging {
+object GpuCoreDumpHandler {
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+
+  private def logInfo(msg: => String): Unit = {
+    if (log.isInfoEnabled) {
+      log.info(msg)
+    }
+  }
+
+  // Mirror Spark's Logging trait: test the level before logging so that the by-name
+  // message (and any string interpolation inside it) is only evaluated when the
+  // statement will actually be emitted.
+  private def logWarning(msg: => String, throwable: Throwable): Unit =
+    if (log.isWarnEnabled) log.warn(msg, throwable)
+
+  private def logError(msg: => String): Unit =
+    if (log.isErrorEnabled) log.error(msg)
+
+  private def logError(msg: => String, throwable: Throwable): Unit =
+    if (log.isErrorEnabled) log.error(msg, throwable)
+
   private var executor: Option[ExecutorService] = None
   private var dumpedPath: Option[String] = None
   private var namedPipeFile: File = _
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuCpuBridgeExpression.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuCpuBridgeExpression.scala
index 76bfcea0970..7d4eab33694 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuCpuBridgeExpression.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuCpuBridgeExpression.scala
@@ -21,7 +21,6 @@ import com.nvidia.spark.rapids.RapidsPluginImplicits._
 import com.nvidia.spark.rapids.ScalableTaskCompletion.onTaskCompletion
 import com.nvidia.spark.rapids.shims.ShimExpression
 
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.catalyst.InternalRow
 import org.apache.spark.sql.catalyst.expressions.{AttributeSeq, Expression}
 import org.apache.spark.sql.rapids.BridgeUnsafeProjection
@@ -47,8 +46,16 @@ case class GpuCpuBridgeExpression(
     gpuInputs: Seq[Expression],
     cpuExpression: Expression,
     outputDataType: DataType,
-    outputNullable: Boolean) extends GpuExpression with ShimExpression 
-    with Logging with GpuBind with GpuMetricsInjectable {
+    outputNullable: Boolean) extends GpuExpression with ShimExpression
+    with GpuBind with GpuMetricsInjectable {
+  // Transient and lazy so the logger is never serialized with this case class and is
+  // re-created on first use after deserialization.
+  @transient private lazy val log = org.slf4j.LoggerFactory.getLogger(
+    getClass.getName.stripSuffix("$"))
+
+  private def logDebug(msg: => String): Unit = {
+    if (log.isDebugEnabled) log.debug(msg)
+  }
 
   override def children: Seq[Expression] = gpuInputs ++ Seq(cpuExpression)
 
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuDataWritingCommandExec.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuDataWritingCommandExec.scala
index 0f4af3f0ca2..a6d49b8bd14 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuDataWritingCommandExec.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuDataWritingCommandExec.scala
@@ -21,43 +21,32 @@ import java.net.URI
 import com.nvidia.spark.rapids.RapidsConf.LORE_SKIP_DUMPING_PLAN
 import com.nvidia.spark.rapids.lore.{GpuLore, GpuLoreDumpExec}
 import com.nvidia.spark.rapids.lore.GpuLore.{loreIdOf, LORE_DUMP_PATH_TAG, LORE_DUMP_RDD_TAG}
-import com.nvidia.spark.rapids.shims.{ShimUnaryCommand, ShimUnaryExecNode}
+import com.nvidia.spark.rapids.shims.{ShimDataWritingCommand, ShimUnaryExecNode}
 import org.apache.hadoop.conf.Configuration
 import org.apache.hadoop.fs.Path
 
 import org.apache.spark.SparkContext
 import org.apache.spark.rdd.RDD
-import org.apache.spark.sql.{Row, SaveMode}
+import org.apache.spark.sql.SaveMode
 import org.apache.spark.sql.catalyst.InternalRow
 import org.apache.spark.sql.catalyst.expressions.Attribute
 import org.apache.spark.sql.execution.{SparkPlan, SQLExecution}
-import org.apache.spark.sql.execution.command.DataWritingCommand
 import org.apache.spark.sql.execution.metric.{SQLMetric, SQLMetrics}
 import org.apache.spark.sql.internal.SQLConf
 import org.apache.spark.sql.rapids.GpuWriteJobStatsTracker
 import org.apache.spark.sql.rapids.shims.RapidsErrorUtils
-import org.apache.spark.sql.rapids.shims.TrampolineConnectShims.SparkSession
 import org.apache.spark.sql.vectorized.ColumnarBatch
 import org.apache.spark.util.SerializableConfiguration
 
 /**
  * An extension of `DataWritingCommand` that allows columnar execution.
  */
-trait GpuDataWritingCommand extends DataWritingCommand with ShimUnaryCommand {
+trait GpuDataWritingCommand extends ShimDataWritingCommand {
   lazy val basicMetrics: Map[String, GpuMetric] = GpuWriteJobStatsTracker.basicMetrics
   lazy val taskMetrics: Map[String, GpuMetric] = GpuWriteJobStatsTracker.taskMetrics
 
   override lazy val metrics: Map[String, SQLMetric] = GpuMetric.unwrap(basicMetrics ++ taskMetrics)
 
-  def run(sparkSession: SparkSession, child: SparkPlan): Seq[Row] = {
-    Arm.withResource(runColumnar(sparkSession, child)) { batches =>
-      assert(batches.isEmpty)
-    }
-    Seq.empty[Row]
-  }
-
-  def runColumnar(sparkSession: SparkSession, child: SparkPlan): Seq[ColumnarBatch]
-
   def gpuWriteJobStatsTracker(
       hadoopConf: Configuration): GpuWriteJobStatsTracker = {
     val serializableHadoopConf = new SerializableConfiguration(hadoopConf)
@@ -122,7 +111,7 @@ case class GpuDataWritingCommandExec(cmd: GpuDataWritingCommand, child: SparkPla
     dumpLoreMetaInfo()
     // Execute the command with LoRE dumping if needed
     val childWithDumping = dumpLoreRDD(child)
-    cmd.runColumnar(sparkSession, childWithDumping)
+    cmd.runColumnarFromAny(sparkSession, childWithDumping)
   }
 
   override def output: Seq[Attribute] = cmd.output
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuDeviceManager.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuDeviceManager.scala
index e2674b1b7f0..822b9c3fee2 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuDeviceManager.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuDeviceManager.scala
@@ -27,7 +27,6 @@ import com.nvidia.spark.rapids.jni.RmmSpark
 import com.nvidia.spark.rapids.spill.SpillFramework
 
 import org.apache.spark.{SparkConf, SparkEnv, TaskContext}
-import org.apache.spark.internal.Logging
 import org.apache.spark.network.util.ByteUnit
 import org.apache.spark.resource.ResourceInformation
 import org.apache.spark.sql.internal.SQLConf
@@ -38,7 +37,29 @@ private case object Initialized extends MemoryState
 private case object Uninitialized extends MemoryState
 private case object Errored extends MemoryState
 
-object GpuDeviceManager extends Logging {
+object GpuDeviceManager {
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+
+  private def logDebug(msg: => String): Unit = {
+    if (log.isDebugEnabled) {
+      log.debug(msg)
+    }
+  }
+
+  private def logInfo(msg: => String): Unit = {
+    if (log.isInfoEnabled) {
+      log.info(msg)
+    }
+  }
+
+  // Check the level before logging so the by-name message is only evaluated when the
+  // statement will actually be emitted, as Spark's Logging trait does.
+  private def logWarning(msg: => String): Unit =
+    if (log.isWarnEnabled) log.warn(msg)
+
+  private def logError(msg: => String): Unit =
+    if (log.isErrorEnabled) log.error(msg)
+
   // This config controls whether RMM/Pinned memory are initialized from the task
   // or from the executor side plugin. The default is to initialize from the
   // executor plugin.
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuExec.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuExec.scala
index 609b17d44ea..23cf056c813 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuExec.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuExec.scala
@@ -26,6 +26,7 @@ import org.apache.spark.{Partition, TaskContext}
 import org.apache.spark.internal.Logging
 import org.apache.spark.rapids.LocationPreservingMapPartitionsRDD
 import org.apache.spark.rdd.RDD
+import org.apache.spark.sql.SparkSession
 import org.apache.spark.sql.catalyst.expressions.{Alias, AttributeReference, Expression, ExprId}
 import org.apache.spark.sql.catalyst.plans.QueryPlan
 import org.apache.spark.sql.catalyst.trees.TreeNodeTag
@@ -35,8 +36,6 @@ import org.apache.spark.sql.execution.exchange.{Exchange, ReusedExchangeExec}
 import org.apache.spark.sql.execution.metric.SQLMetric
 import org.apache.spark.sql.rapids.GpuTaskMetrics
 import org.apache.spark.sql.rapids.execution.{GpuCustomShuffleReaderExec}
-import org.apache.spark.sql.rapids.shims.SparkSessionUtils
-import org.apache.spark.sql.rapids.shims.TrampolineConnectShims.SparkSession
 import org.apache.spark.sql.vectorized.ColumnarBatch
 
 /**
@@ -95,7 +94,50 @@ class GpuOpTimeTrackingRDD[T: scala.reflect.ClassTag](
     firstParent[T].preferredLocations(split)
 }
 
+trait RapidsLocalLog {
+  @transient private lazy val rapidsLocalLog = org.slf4j.LoggerFactory.getLogger(
+    getClass.getName.stripSuffix("$"))
+
+  protected def logTrace(msg: => String): Unit = {
+    if (rapidsLocalLog.isTraceEnabled) rapidsLocalLog.trace(msg)
+  }
+
+  protected def logDebug(msg: => String): Unit = {
+    if (rapidsLocalLog.isDebugEnabled) rapidsLocalLog.debug(msg)
+  }
+
+  protected def logDebug(msg: => String, throwable: Throwable): Unit = {
+    if (rapidsLocalLog.isDebugEnabled) rapidsLocalLog.debug(msg, throwable)
+  }
+
+  protected def logInfo(msg: => String): Unit = {
+    if (rapidsLocalLog.isInfoEnabled) rapidsLocalLog.info(msg)
+  }
+
+  protected def logWarning(msg: => String): Unit = {
+    if (rapidsLocalLog.isWarnEnabled) rapidsLocalLog.warn(msg)
+  }
+
+  protected def logWarning(msg: => String, throwable: Throwable): Unit = {
+    if (rapidsLocalLog.isWarnEnabled) rapidsLocalLog.warn(msg, throwable)
+  }
+
+  protected def logError(msg: => String): Unit = {
+    if (rapidsLocalLog.isErrorEnabled) rapidsLocalLog.error(msg)
+  }
+
+  protected def logError(msg: => String, throwable: Throwable): Unit = {
+    if (rapidsLocalLog.isErrorEnabled) rapidsLocalLog.error(msg, throwable)
+  }
+}
+
 object GpuExec {
+  @transient private[this] lazy val sparkPlanSessionMethod =
+    classOf[SparkPlan].getMethod("session")
+
+  def sessionFromPlan(plan: SparkPlan): SparkSession =
+    sparkPlanSessionMethod.invoke(plan).asInstanceOf[SparkSession]
+
   def outputBatching(sp: SparkPlan): CoalesceGoal = sp match {
     case gpu: GpuExec => gpu.outputBatching
     case _ => null
@@ -111,7 +153,7 @@ trait GpuExec extends SparkPlan with Logging {
     RapidsConf.OP_TIME_TRACKING_RDD_ENABLED.get(conf)
 
   def sparkSession: SparkSession = {
-    SparkSessionUtils.sessionFromPlan(this)
+    GpuExec.sessionFromPlan(this)
   }
 
   /**
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuGetJsonObject.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuGetJsonObject.scala
index bd6760f6765..8287f37dce8 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuGetJsonObject.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuGetJsonObject.scala
@@ -280,7 +280,7 @@ class GetJsonObjectCombiner(private val exp: GpuGetJsonObject) extends GpuExpres
   override def addExpression(e: Expression): Unit = {
     val localOutputLocation = outputLocation
     outputLocation += 1
-    val key = GpuExpressionEquals(e)
+    val key = new GpuExpressionEquals(e)
     if (!toCombine.contains(key)) {
       toCombine.put(key, localOutputLocation)
     }
@@ -329,7 +329,7 @@ class GetJsonObjectCombiner(private val exp: GpuGetJsonObject) extends GpuExpres
   }
 
   override def getReplacementExpression(e: Expression): Option[Expression] = {
-    toCombine.get(GpuExpressionEquals(e)).map { localId =>
+    toCombine.get(new GpuExpressionEquals(e)).map { localId =>
       GpuGetStructField(multiGet, localId, Some(fieldName(localId)))
     }
   }
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuHashPartitioningBase.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuHashPartitioningBase.scala
index 226ed0d381b..d536cb1980b 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuHashPartitioningBase.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuHashPartitioningBase.scala
@@ -20,7 +20,6 @@ import ai.rapids.cudf.{DType, PartitionedTable}
 import com.nvidia.spark.rapids.Arm.withResource
 import com.nvidia.spark.rapids.shims.ShimExpression
 
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.catalyst.expressions.{Expression, HiveHash, Murmur3Hash}
 import org.apache.spark.sql.catalyst.plans.physical.HashPartitioning
 import org.apache.spark.sql.rapids.{GpuHashExpression, GpuHiveHash, GpuMurmur3Hash, GpuPmod}
@@ -95,7 +94,16 @@ abstract class GpuHashPartitioningBase(expressions: Seq[Expression], numPartitio
   def partitionIdExpression: GpuExpression = GpuPmod(hashFunc, GpuLiteral(numPartitions))
 }
 
-object GpuHashPartitioningBase extends Logging {
+object GpuHashPartitioningBase {
+  // Name the logger after the object without the trailing "$" of its module class,
+  // matching the logger name Spark's Logging trait produced before this change.
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+
+  private def logDebug(msg: => String): Unit = {
+    if (log.isDebugEnabled) {
+      log.debug(msg)
+    }
+  }
 
   val DEFAULT_HASH_SEED: Int = 42
 
@@ -117,7 +125,7 @@ object GpuHashPartitioningBase extends Logging {
         hashMode = hashModeMethod.invoke(cpuHp) match {
           case m if m == classOf[Murmur3Hash] => Murmur3Mode
           case h if h == classOf[HiveHash] => HiveMode
-          case o => UnsupportedMode(o.asInstanceOf[Class[_]].getSimpleName)
+          case o => new UnsupportedMode(o.asInstanceOf[Class[_]].getSimpleName)
         }
         logDebug(s"Found hash function '$hashMode' from CPU hash partitioning.")
       } catch {
@@ -134,6 +142,14 @@ sealed trait HashMode extends Serializable
 
 case object Murmur3Mode extends HashMode
 case object HiveMode extends HashMode
-case class UnsupportedMode(modeName: String) extends HashMode {
+class UnsupportedMode(val modeName: String) extends HashMode {
+  // Keep the value equality the replaced case class provided; presumably HashMode
+  // values are compared when partitionings are compared - confirm against callers.
+  override def equals(other: Any): Boolean = other match {
+    case that: UnsupportedMode => modeName == that.modeName
+    case _ => false
+  }
+
+  override def hashCode(): Int = modeName.##
   override def toString: String = modeName
 }
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuInSet.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuInSet.scala
index 55df29f3454..e116d85b311 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuInSet.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuInSet.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2020-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2020-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -18,14 +18,15 @@ package com.nvidia.spark.rapids
 
 import ai.rapids.cudf.{ColumnVector, DType, Scalar}
 import com.nvidia.spark.rapids.Arm.{closeOnExcept, withResource}
+import com.nvidia.spark.rapids.shims.ShimPredicate
 
-import org.apache.spark.sql.catalyst.expressions.{Expression, Literal, Predicate}
+import org.apache.spark.sql.catalyst.expressions.{Expression, Literal}
 import org.apache.spark.sql.internal.SQLConf
 import org.apache.spark.sql.types.{DoubleType, FloatType}
 
 case class GpuInSet(
     child: Expression,
-    list: Seq[Any]) extends GpuUnaryExpression with Predicate {
+    list: Seq[Any]) extends GpuUnaryExpression with ShimPredicate {
   require(list != null, "list should not be null")
 
   @transient private[this] lazy val hasNull: Boolean = list.contains(null)
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuListUtils.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuListUtils.scala
deleted file mode 100644
index b351e376007..00000000000
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuListUtils.scala
+++ /dev/null
@@ -1,56 +0,0 @@
-/*
- * Copyright (c) 2021-2023, NVIDIA CORPORATION.
- *
- * Licensed under the Apache License, Version 2.0 (the "License");
- * you may not use this file except in compliance with the License.
- * You may obtain a copy of the License at
- *
- *     http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-
-package com.nvidia.spark.rapids
-
-import java.util.Optional
-
-import ai.rapids.cudf.{ColumnView, DType}
-import com.nvidia.spark.rapids.Arm.withResource
-
-/**
- * Provide a set of APIs to manipulate array/list columns in common ways.
- */
-object GpuListUtils {
-  /**
-   * Replace the data column in a LIST column. This will keep the same offsets and validity
-   * of the listColumn.  This returns a view so it is the responsibility of the caller to keep
-   * both listCol and newDataCol alive longer than the returned ColumnView.
-   * @param listCol the list column to use as a template
-   * @param newDataCol the new data column.
-   * @return a new ColumnView.
-   * @throws scala.IllegalArgumentException if data column does not match the original data column
-   *                                        in size.
-   */
-  def replaceListDataColumnAsView(
-      listCol: ColumnView,
-      newDataCol: ColumnView): ColumnView = {
-    assert(DType.LIST.equals(listCol.getType))
-    withResource(listCol.getChildColumnView(0)) { dataCol =>
-      if (dataCol.getRowCount != newDataCol.getRowCount) {
-        throw new scala.IllegalArgumentException(
-          "Mismatch in the number of rows in the data columns")
-      }
-    }
-    withResource(listCol.getOffsets) { offsets =>
-      withResource(listCol.getValid) { validity =>
-        new ColumnView(DType.LIST, listCol.getRowCount,
-          Optional.of[java.lang.Long](listCol.getNullCount), validity, offsets,
-          Array[ColumnView](newDataCol))
-      }
-    }
-  }
-}
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuMapUtils.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuMapUtils.scala
index 1de3b50de3b..e8dd755c82d 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuMapUtils.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuMapUtils.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2021-2024, NVIDIA CORPORATION.
+ * Copyright (c) 2021-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -177,7 +177,7 @@ object GpuMapUtils {
 
 }
 
-case class GpuMapFromArraysMeta(expr: MapFromArrays,
+class GpuMapFromArraysMeta(expr: MapFromArrays,
                                 override val conf: RapidsConf,
                                 override val parent: Option[RapidsMeta[_, _, _]],
                                 rule: DataFromReplacementRule)
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuMetrics.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuMetrics.scala
index f6ae2bbbe8e..2065bf7b375 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuMetrics.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuMetrics.scala
@@ -21,7 +21,6 @@ import scala.collection.immutable.TreeMap
 import com.nvidia.spark.rapids.metrics.GpuBubbleTimerManager
 
 import org.apache.spark.{SparkContext, TaskContext}
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.SparkSession
 import org.apache.spark.sql.catalyst.expressions.Expression
 import org.apache.spark.sql.execution.metric.{SQLMetric, SQLMetrics}
@@ -86,7 +85,7 @@ class GpuMetricFactory(metricsConf: MetricsLevel, context: SparkContext) {
     createInternal(level, SQLMetrics.createTimingMetric(context, name))
 }
 
-object GpuMetric extends Logging {
+object GpuMetric {
   // Metric names.
   val BUFFER_TIME = "bufferTime"
   val BUFFER_TIME_BUBBLE = "bufferTimeBubble"
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuMultiFileReader.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuMultiFileReader.scala
index 892e151594e..cf73e368989 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuMultiFileReader.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuMultiFileReader.scala
@@ -40,7 +40,6 @@ import org.apache.hadoop.fs.{FileSystem, Path}
 
 import org.apache.spark.{SparkEnv, TaskContext}
 import org.apache.spark.broadcast.Broadcast
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.catalyst.InternalRow
 import org.apache.spark.sql.connector.read.{InputPartition, PartitionReader, PartitionReaderFactory}
 import org.apache.spark.sql.execution.QueryExecutionException
@@ -185,7 +184,19 @@ trait MultiFileReaderFunctions {
 
 // Singleton thread pool used across all tasks for multifile reading.
 // Please note that the TaskContext is not set in these threads and should not be used.
-object MultiFileReaderThreadPool extends Logging {
+object MultiFileReaderThreadPool {
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+
+  private def logDebug(msg: => String): Unit = {
+    if (log.isDebugEnabled) {
+      log.debug(msg)
+    }
+  }
+
+  // Check the level first so the by-name message is only built when WARN is enabled.
+  private def logWarning(msg: => String): Unit =
+    if (log.isWarnEnabled) log.warn(msg)
+
   @volatile
   private var threadPool: Option[ThreadPoolExecutor] = None
 
@@ -296,7 +307,7 @@ abstract class MultiFilePartitionReaderFactoryBase(
     @transient sqlConf: SQLConf,
     broadcastedConf: Broadcast[SerializableConfiguration],
     @transient rapidsConf: RapidsConf)
-  extends PartitionReaderFactory with Logging {
+  extends PartitionReaderFactory with RapidsLocalLog {
 
   protected val maxReadBatchSizeRows: Int = rapidsConf.maxReadBatchSizeRows
   protected val maxReadBatchSizeBytes: Long = rapidsConf.maxReadBatchSizeBytes
@@ -388,7 +399,7 @@ abstract class MultiFilePartitionReaderFactoryBase(
  * @param execMetrics metrics
  */
 abstract class FilePartitionReaderBase(conf: Configuration, execMetrics: Map[String, GpuMetric])
-    extends PartitionReader[ColumnarBatch] with Logging with ScanWithMetrics {
+    extends PartitionReader[ColumnarBatch] with RapidsLocalLog with ScanWithMetrics {
 
   metrics = execMetrics
 
@@ -405,42 +416,25 @@ abstract class FilePartitionReaderBase(conf: Configuration, execMetrics: Map[Str
   }
 }
 
-case class CombineConf(
-    combineThresholdSize: Long, // The size to combine to when combining small files
-    combineWaitTime: Int) // The amount of time to wait for other files ready for combination.
-
-// TODO: Refactor thread pool components into a common utility, since it is not specific to
-//  multi-file reading.
-trait ThreadPoolConf {
-  /**
-   * The maximum number of threads used by the thread pool, not necessarily the final number
-   */
-  def maxThreadNumber: Int
-
-  /**
-   * Whether to create pools for each Spark stage, only for testing for now
-   */
-  def stageLevelPool: Boolean
-}
-
-case class DefaultThreadPoolConf(
-    maxThreadNumber: Int,
-    stageLevelPool: Boolean) extends ThreadPoolConf
-
-case class MemoryBoundedPoolConf(
-    maxThreadNumber: Int,
-    stageLevelPool: Boolean,
-    memoryCapacity: Long, // The maximum host memory being used in bytes, must be > 0
-    waitMemTimeoutMs: Long // The timeout for acquiring host memory in milliseconds
-) extends ThreadPoolConf
-
 class ThreadPoolConfBuilder(
     private val maxThreadNumber: Int,
     private val isMemoryBounded: Boolean,
     private val memoryCapacityFromDriver: Long,
     private val timeoutMs: Long,
     private val stageLevelPool: Boolean
-) extends Logging with Serializable {
+) extends Serializable {
+  // Transient and lazy: this class is Serializable, so the logger must stay out of
+  // the serialized form and be re-created on first use after deserialization, which
+  // is what the Logging trait it replaces did.
+  @transient private lazy val log = org.slf4j.LoggerFactory.getLogger(
+    getClass.getName.stripSuffix("$"))
+
+  private def logDebug(msg: => String): Unit =
+    if (log.isDebugEnabled) log.debug(msg)
+
+  // Level check keeps the by-name message from being built when WARN is disabled.
+  private def logWarning(msg: => String): Unit =
+    if (log.isWarnEnabled) log.warn(msg)
 
   // Finalize the ThreadPoolConf, which mainly determines the memory capacity of the
   // ResourceBoundedThreadExecutor if isMemoryBounded is true.
@@ -452,7 +446,7 @@ class ThreadPoolConfBuilder(
   // 3. if still not set, use the default value `DEFAULT_MEMORY_CAPACITY`.
   def build(): ThreadPoolConf = {
     if (!isMemoryBounded) {
-      DefaultThreadPoolConf(maxThreadNumber, stageLevelPool)
+      new DefaultThreadPoolConf(maxThreadNumber, stageLevelPool)
     } else {
       val memCap: Long = if (memoryCapacityFromDriver > 0) {
         memoryCapacityFromDriver
@@ -468,11 +462,7 @@ class ThreadPoolConfBuilder(
         }
       }
       logDebug(s"Setting memory capacity for ResourcePoolConf to ${memCap >> 20}MB")
-      MemoryBoundedPoolConf(
-        maxThreadNumber = maxThreadNumber,
-        stageLevelPool = stageLevelPool,
-        memoryCapacity = memCap,
-        waitMemTimeoutMs = timeoutMs)
+      new MemoryBoundedPoolConf(maxThreadNumber, stageLevelPool, memCap, timeoutMs)
     }
   }
 }
@@ -523,7 +513,7 @@ abstract class MultiFileCloudPartitionReaderBase(
     maxReadBatchSizeBytes: Long,
     ignoreCorruptFiles: Boolean = false,
     keepReadsInOrder: Boolean = true,
-    combineConf: CombineConf = CombineConf(-1, -1))
+    combineConf: CombineConf = new CombineConf(-1, -1))
   extends FilePartitionReaderBase(conf, execMetrics) {
 
   protected type BufferInfo = HostMemoryBuffersWithMetaDataBase
@@ -1142,13 +1132,21 @@ abstract class MultiFileCoalescingPartitionReaderBase(
     }
   }
 
-  protected case class CurrentChunkMeta(
-    clippedSchema: SchemaBase,
-    readSchema: StructType,
-    currentChunk: FileMajorBlockChunk,
-    extraInfo: ExtraInfo) {
+  protected class CurrentChunkMeta(
+    val clippedSchema: SchemaBase,
+    val readSchema: StructType,
+    val currentChunk: FileMajorBlockChunk,
+    val extraInfo: ExtraInfo) {
     def rowsPerPartition: Array[Long] = currentChunk.rowsPerPartition
     def allPartValues: Array[InternalRow] = currentChunk.allPartValues
+
+    def copy(
+        clippedSchema: SchemaBase = this.clippedSchema,
+        readSchema: StructType = this.readSchema,
+        currentChunk: FileMajorBlockChunk = this.currentChunk,
+        extraInfo: ExtraInfo = this.extraInfo): CurrentChunkMeta = {
+      new CurrentChunkMeta(clippedSchema, readSchema, currentChunk, extraInfo)
+    }
   }
 
   /**
@@ -1609,6 +1607,6 @@ abstract class MultiFileCoalescingPartitionReaderBase(
     logDebug(s"Loaded $numRows rows from ${getFileFormatShortName}. " +
       s"${getFileFormatShortName} bytes read: $numChunkBytes. Estimated GPU bytes: $numBytes. " +
       s"Number of partition entries: ${fileMajorChunk.allPartValues.length}")
-    CurrentChunkMeta(currentClippedSchema, currentReadSchema, fileMajorChunk, extraInfo)
+    new CurrentChunkMeta(currentClippedSchema, currentReadSchema, fileMajorChunk, extraInfo)
   }
 }
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuOrcScan.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuOrcScan.scala
index bc246a152f6..52c909f1ad9 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuOrcScan.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuOrcScan.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2019-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2019-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -18,7 +18,7 @@ package com.nvidia.spark.rapids
 
 import java.io.{ByteArrayInputStream, FileNotFoundException, IOException, OutputStream}
 import java.net.URI
-import java.nio.ByteBuffer
+import java.nio.{Buffer, ByteBuffer}
 import java.nio.channels.Channels
 import java.nio.charset.StandardCharsets
 import java.time.ZoneId
@@ -39,6 +39,7 @@ import com.nvidia.spark.rapids.RmmRapidsRetryIterator.withRetryNoSplit
 import com.nvidia.spark.rapids.SchemaUtils._
 import com.nvidia.spark.rapids.filecache.FileCache
 import com.nvidia.spark.rapids.fileio.hadoop.HadoopFileIO
+import com.nvidia.spark.rapids.fileio.hadoop.PerfIOHadoopInputFileFactory
 import com.nvidia.spark.rapids.io.async._
 import com.nvidia.spark.rapids.jni.{CastStrings, RmmSpark}
 import com.nvidia.spark.rapids.shims.{ColumnDefaultValuesShims, GpuOrcDataReader, NullOutputStreamShim, OrcCastingShims, OrcReadingShims, OrcShims, ShimFilePartitionReaderFactory}
@@ -55,7 +56,6 @@ import org.apache.orc.mapred.OrcInputFormat
 
 import org.apache.spark.TaskContext
 import org.apache.spark.broadcast.Broadcast
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.SparkSession
 import org.apache.spark.sql.catalyst.InternalRow
 import org.apache.spark.sql.catalyst.expressions.Expression
@@ -88,7 +88,7 @@ case class GpuOrcScan(
     dataFilters: Seq[Expression],
     rapidsConf: RapidsConf,
     queryUsesInputFile: Boolean = false)
-  extends FileScan with GpuScan with Logging {
+  extends FileScan with GpuScan {
 
   override def isSplitable(path: Path): Boolean = true
 
@@ -101,12 +101,12 @@ case class GpuOrcScan(
 
     if (rapidsConf.isOrcPerFileReadEnabled) {
       logInfo("Using the original per file orc reader")
-      GpuOrcPartitionReaderFactory(sparkSession.sessionState.conf, broadcastedConf,
+      new GpuOrcPartitionReaderFactory(sparkSession.sessionState.conf, broadcastedConf,
         dataSchema, readDataSchema, readPartitionSchema, pushedFilters, rapidsConf, metrics,
         options.asScala.toMap)
     } else {
       val poolConfBuilder = ThreadPoolConfBuilder(rapidsConf)
-      GpuOrcMultiFilePartitionReaderFactory(sparkSession.sessionState.conf, broadcastedConf,
+      new GpuOrcMultiFilePartitionReaderFactory(sparkSession.sessionState.conf, broadcastedConf,
         dataSchema, readDataSchema, readPartitionSchema, pushedFilters, rapidsConf,
         poolConfBuilder,
         metrics, queryUsesInputFile)
@@ -578,7 +578,7 @@ object GpuOrcScan {
  *                            off in GpuTransitionOverrides if InputFileName,
  *                            InputFileBlockStart, or InputFileBlockLength are used
  */
-case class GpuOrcMultiFilePartitionReaderFactory(
+class GpuOrcMultiFilePartitionReaderFactory(
     @transient sqlConf: SQLConf,
     broadcastedConf: Broadcast[SerializableConfiguration],
     dataSchema: StructType,
@@ -589,7 +589,8 @@ case class GpuOrcMultiFilePartitionReaderFactory(
     poolConfBuilder: ThreadPoolConfBuilder,
     metrics: Map[String, GpuMetric],
     queryUsesInputFile: Boolean)
-  extends MultiFilePartitionReaderFactoryBase(sqlConf, broadcastedConf, rapidsConf) {
+  extends MultiFilePartitionReaderFactoryBase(sqlConf, broadcastedConf, rapidsConf)
+      with Serializable {
 
   private val debugDumpPrefix = rapidsConf.orcDebugDumpPrefix
   private val debugDumpAlways = rapidsConf.orcDebugDumpAlways
@@ -619,7 +620,7 @@ case class GpuOrcMultiFilePartitionReaderFactory(
    */
   override def buildBaseColumnarReaderForCloud(files: Array[PartitionedFile], conf: Configuration):
       PartitionReader[ColumnarBatch] = {
-    val combineConf = CombineConf(combineThresholdSize, combineWaitTime)
+    val combineConf = new CombineConf(combineThresholdSize, combineWaitTime)
     val poolConf = poolConfBuilder.build()
     val reader = new MultiFileCloudOrcPartitionReader(
       conf, files, dataSchema, readDataSchema, partitionSchema,
@@ -658,13 +659,13 @@ case class GpuOrcMultiFilePartitionReaderFactory(
           compressionAndStripes.getOrElseUpdate(orcPartitionReaderContext.compressionKind,
             new ArrayBuffer[OrcSingleStripeMeta]) ++=
             orcPartitionReaderContext.blockIterator.map(block =>
-              OrcSingleStripeMeta(
+              new OrcSingleStripeMeta(
                 orcPartitionReaderContext.filePath,
-                OrcDataStripe(OrcStripeWithMeta(block, orcPartitionReaderContext)),
+                new OrcDataStripe(new OrcStripeWithMeta(block, orcPartitionReaderContext)),
                 file.partitionValues,
-                OrcSchemaWrapper(orcPartitionReaderContext.updatedReadSchema),
+                new OrcSchemaWrapper(orcPartitionReaderContext.updatedReadSchema),
                 readDataSchema,
-                OrcExtraInfo(orcPartitionReaderContext.requestedMapping)))
+                new OrcExtraInfo(orcPartitionReaderContext.requestedMapping)))
         }
       }
     }
@@ -687,7 +688,7 @@ case class GpuOrcMultiFilePartitionReaderFactory(
   override final def getFileFormatShortName: String = "ORC"
 }
 
-case class GpuOrcPartitionReaderFactory(
+class GpuOrcPartitionReaderFactory(
     @transient sqlConf: SQLConf,
     broadcastedConf: Broadcast[SerializableConfiguration],
     dataSchema: StructType,
@@ -697,7 +698,7 @@ case class GpuOrcPartitionReaderFactory(
     @transient rapidsConf: RapidsConf,
     metrics : Map[String, GpuMetric],
     @transient params: Map[String, String])
-  extends ShimFilePartitionReaderFactory(params) {
+  extends ShimFilePartitionReaderFactory(params) with Serializable {
 
   private val isCaseSensitive = sqlConf.caseSensitiveAnalysis
   private val debugDumpPrefix = rapidsConf.orcDebugDumpPrefix
@@ -754,10 +755,10 @@ case class GpuOrcPartitionReaderFactory(
  * @param footer stripe footer
  * @param inputDataRanges input file ranges (based at file offset 0) of stripe data
  */
-case class OrcOutputStripe(
-    infoBuilder: OrcProto.StripeInformation.Builder,
-    footer: OrcProto.StripeFooter,
-    inputDataRanges: DiskRangeList)
+class OrcOutputStripe(
+    val infoBuilder: OrcProto.StripeInformation.Builder,
+    val footer: OrcProto.StripeFooter,
+    val inputDataRanges: DiskRangeList) extends Serializable
 
 /**
  * This class holds fields needed to read and iterate over the OrcFile
@@ -775,18 +776,18 @@ case class OrcOutputStripe(
  * @param blockIterator an iterator over the ORC output stripes
  * @param requestedMapping the optional requested column ids
  */
-case class OrcPartitionReaderContext(
-    filePath: Path,
-    conf: Configuration,
-    fileSchema: TypeDescription,
-    updatedReadSchema: TypeDescription,
-    evolution: SchemaEvolution,
-    fileTail: OrcProto.FileTail,
-    compressionSize: Int,
-    compressionKind: CompressionKind,
-    readerOpts: Reader.Options,
-    blockIterator: BufferedIterator[OrcOutputStripe],
-    requestedMapping: Option[Array[Int]])
+class OrcPartitionReaderContext(
+    val filePath: Path,
+    val conf: Configuration,
+    val fileSchema: TypeDescription,
+    val updatedReadSchema: TypeDescription,
+    val evolution: SchemaEvolution,
+    val fileTail: OrcProto.FileTail,
+    val compressionSize: Int,
+    val compressionKind: CompressionKind,
+    val readerOpts: Reader.Options,
+    val blockIterator: BufferedIterator[OrcOutputStripe],
+    val requestedMapping: Option[Array[Int]]) extends Serializable
 
 case class OrcBlockMetaForSplitCheck(
     filePath: Path,
@@ -1033,8 +1034,8 @@ trait OrcCommonFunctions extends OrcCodecWritingHelper { self: FilePartitionRead
 /**
  * A base ORC partition reader which compose of some common methods
  */
-trait OrcPartitionReaderBase extends OrcCommonFunctions with Logging
-  with ScanWithMetrics { self: FilePartitionReaderBase =>
+trait OrcPartitionReaderBase extends OrcCommonFunctions
+  with RapidsLocalLog with ScanWithMetrics { self: FilePartitionReaderBase =>
 
   def populateCurrentBlockChunk(
       blockIterator: BufferedIterator[OrcOutputStripe],
@@ -1467,7 +1468,8 @@ private case class GpuOrcFileFilterHandler(
         sargApp, sargColumns, OrcConf.IGNORE_NON_UTF8_BLOOM_FILTERS.getBoolean(conf),
         orcReader.getWriterVersion, updatedReadSchema,
         resolveMemFileIncluded(fileIncluded, requestedMapping))
-      OrcPartitionReaderContext(filePath, conf, orcReader.getSchema, updatedReadSchema, evolution,
+      new OrcPartitionReaderContext(
+        filePath, conf, orcReader.getSchema, updatedReadSchema, evolution,
         orcReader.getFileTail, orcReader.getCompressionSize, orcReader.getCompressionKind,
         readerOpts, stripes.iterator.buffered, requestedMapping)
     }
@@ -1611,7 +1613,7 @@ private case class GpuOrcFileFilterHandler(
         .setDataLength(outputStripeDataLength)
         .setNumberOfRows(inputStripe.getNumberOfRows)
 
-      OrcOutputStripe(infoBuilder, outputStripeFooter, rangeCreator.get)
+      new OrcOutputStripe(infoBuilder, outputStripeFooter, rangeCreator.get)
     }
 
     /**
@@ -1790,7 +1792,9 @@ private object GpuOrcFileFilterHandler {
       fs: FileSystem,
       conf: Configuration,
       metrics: Map[String, GpuMetric]): OrcTail = {
-    val fileIO = new HadoopFileIO(conf)
+    val fileIO = new HadoopFileIO(
+      conf,
+      PerfIOHadoopInputFileFactory.INSTANCE)
     val inputFile = fileIO.newInputFile(filePath)
     val cachedFooter = FileCache.get.getFooter(inputFile)
     val bb = cachedFooter.map { hmb =>
@@ -1832,7 +1836,7 @@ private object GpuOrcFileFilterHandler {
       val fileSize = bb.getLong
       val modificationTime = bb.getLong
       val serializedTail = bb.slice()
-      bb.position(0)
+      bb.asInstanceOf[Buffer].position(0)
       // last byte is the size of the postscript section
       val psSize = bb.get(bb.limit() - 1) & 0xff
       val ps = loadPostScript(bb, psSize)
@@ -1866,8 +1870,8 @@ private object GpuOrcFileFilterHandler {
         val bb = ByteBuffer.allocate(footerSizeGuess)
         val readSize = fileSize.min(footerSizeGuess).toInt
         in.readFully(fileSize - readSize, bb.array(), bb.arrayOffset(), readSize)
-        bb.position(0)
-        bb.limit(readSize)
+        bb.asInstanceOf[Buffer].position(0)
+        bb.asInstanceOf[Buffer].limit(readSize)
         val psLen = bb.get(readSize - 1) & 0xff
         ensureOrcFooter(in, filePath, psLen, bb)
         val psOffset = readSize - 1 - psLen
@@ -1878,18 +1882,18 @@ private object GpuOrcFileFilterHandler {
         // calculate the amount of tail data that was missed in the speculative initial read
         val unreadRemaining = Math.max(0, tailSize - readSize)
         // copy tail bytes from original buffer
-        bb.position(Math.max(0, readSize - tailSize))
-        tailBuffer.position(TAIL_PREFIX_SIZE + unreadRemaining)
+        bb.asInstanceOf[Buffer].position(Math.max(0, readSize - tailSize))
+        tailBuffer.asInstanceOf[Buffer].position(TAIL_PREFIX_SIZE + unreadRemaining)
         tailBuffer.put(bb)
         if (unreadRemaining > 0) {
           // first read did not grab the entire tail, need to read more
-          tailBuffer.position(TAIL_PREFIX_SIZE)
+          tailBuffer.asInstanceOf[Buffer].position(TAIL_PREFIX_SIZE)
           in.readFully(fileSize - readSize - unreadRemaining, tailBuffer.array(),
             tailBuffer.arrayOffset() + tailBuffer.position(), unreadRemaining)
         }
         tailBuffer.putLong(0, fileSize)
         tailBuffer.putLong(java.lang.Long.BYTES, modificationTime)
-        tailBuffer.position(0)
+        tailBuffer.asInstanceOf[Buffer].position(0)
         tailBuffer
       }
     }
@@ -2044,26 +2048,26 @@ class MultiFileCloudOrcPartitionReader(
     keepReadsInOrder = keepReadsInOrder, combineConf = combineConf)
   with MultiFileReaderFunctions with OrcPartitionReaderBase {
 
-  private case class HostMemoryEmptyMetaData(
+  private class HostMemoryEmptyMetaData(
       override val partitionedFile: PartitionedFile,
-      numRows: Long,
+      val numRows: Long,
       override val bytesRead: Long,
-      readSchema: StructType,
-      override val allPartValues: Option[Array[(Long, InternalRow)]] = None)
+      val readSchema: StructType,
+      override val allPartValues: Option[Array[(Long, InternalRow)]])
     extends HostMemoryBuffersWithMetaDataBase {
 
     override def memBuffersAndSizes: Array[SingleHMBAndMeta] =
       Array(SingleHMBAndMeta.empty(numRows))
   }
 
-  private case class HostMemoryBuffersWithMetaData(
+  private class HostMemoryBuffersWithMetaData(
       override val partitionedFile: PartitionedFile,
       override val memBuffersAndSizes: Array[SingleHMBAndMeta],
       override val bytesRead: Long,
-      updatedReadSchema: TypeDescription,
-      compressionKind: CompressionKind,
-      requestedMapping: Option[Array[Int]],
-      override val allPartValues: Option[Array[(Long, InternalRow)]] = None)
+      val updatedReadSchema: TypeDescription,
+      val compressionKind: CompressionKind,
+      val requestedMapping: Option[Array[Int]],
+      override val allPartValues: Option[Array[(Long, InternalRow)]])
     extends HostMemoryBuffersWithMetaDataBase
 
   private class ReadBatchRunner(
@@ -2083,13 +2087,13 @@ class MultiFileCloudOrcPartitionReader(
       } catch {
         case e: FileNotFoundException if ignoreMissingFiles =>
           logWarning(s"Skipped missing file: ${partFile.filePath}", e)
-          HostMemoryEmptyMetaData(partFile, 0, 0, null)
+          new HostMemoryEmptyMetaData(partFile, 0, 0, null, None)
         // Throw FileNotFoundException even if `ignoreCorruptFiles` is true
         case e: FileNotFoundException if !ignoreMissingFiles => throw e
         case e @ (_: RuntimeException | _: IOException) if ignoreCorruptFiles =>
           logWarning(
             s"Skipped the rest of the content in the corrupted file: ${partFile.filePath}", e)
-          HostMemoryEmptyMetaData(partFile, 0, 0, null)
+          new HostMemoryEmptyMetaData(partFile, 0, 0, null, None)
       } finally {
         RmmSpark.poolThreadFinishedForTask(taskContext.taskAttemptId())
         TrampolineUtil.unsetTaskContext()
@@ -2109,7 +2113,7 @@ class MultiFileCloudOrcPartitionReader(
         if (ctx == null || ctx.blockIterator.isEmpty) {
           val bytesRead = fileSystemBytesRead() - startingBytesRead
           logDebug(s"Read no blocks from file: ${partFile.filePath.toString}")
-          HostMemoryEmptyMetaData(partFile, 0, bytesRead, readDataSchema)
+          new HostMemoryEmptyMetaData(partFile, 0, bytesRead, readDataSchema, None)
         } else {
           blockChunkIter = ctx.blockIterator
           if (isDone) {
@@ -2117,21 +2121,21 @@ class MultiFileCloudOrcPartitionReader(
             // got close before finishing
             logDebug("Reader is closed, return empty buffer for the current read for " +
               s"file: ${partFile.filePath.toString}")
-            HostMemoryEmptyMetaData(partFile, 0, bytesRead, readDataSchema)
+            new HostMemoryEmptyMetaData(partFile, 0, bytesRead, readDataSchema, None)
           } else {
             if (ctx.updatedReadSchema.isEmpty) {
               val bytesRead = fileSystemBytesRead() - startingBytesRead
               val numRows = ctx.blockIterator.map(_.infoBuilder.getNumberOfRows).sum
               logDebug(s"Return empty buffer but with row number: $numRows for " +
                 s"file: ${partFile.filePath.toString}")
-              HostMemoryEmptyMetaData(partFile, numRows, bytesRead, readDataSchema)
+              new HostMemoryEmptyMetaData(partFile, numRows, bytesRead, readDataSchema, None)
             } else {
               while (blockChunkIter.hasNext) {
                 val blocksToRead = populateCurrentBlockChunk(blockChunkIter, maxReadBatchSizeRows,
                   maxReadBatchSizeBytes)
                 val (hostBuf, bufSize) = readPartFile(ctx, blocksToRead)
                 val numRows = blocksToRead.map(_.infoBuilder.getNumberOfRows).sum
-                val metas = blocksToRead.map(b => OrcDataStripe(OrcStripeWithMeta(b, ctx)))
+                val metas = blocksToRead.map(b => new OrcDataStripe(new OrcStripeWithMeta(b, ctx)))
                 hostBuffers += SingleHMBAndMeta(Array(hostBuf), bufSize, numRows, metas)
               }
               val bytesRead = fileSystemBytesRead() - startingBytesRead
@@ -2140,10 +2144,10 @@ class MultiFileCloudOrcPartitionReader(
                 hostBuffers.safeClose()
                 logDebug("Reader is closed, return empty buffer for the current read for " +
                   s"file: ${partFile.filePath.toString}")
-                HostMemoryEmptyMetaData(partFile, 0, bytesRead, readDataSchema)
+                new HostMemoryEmptyMetaData(partFile, 0, bytesRead, readDataSchema, None)
               } else {
-                HostMemoryBuffersWithMetaData(partFile, hostBuffers.toArray, bytesRead,
-                  ctx.updatedReadSchema, ctx.compressionKind, ctx.requestedMapping)
+                new HostMemoryBuffersWithMetaData(partFile, hostBuffers.toArray, bytesRead,
+                  ctx.updatedReadSchema, ctx.compressionKind, ctx.requestedMapping, None)
               }
             }
           }
@@ -2159,10 +2163,10 @@ class MultiFileCloudOrcPartitionReader(
     }
   }
 
-  private case class CombinedMeta(
-    combinedEmptyMeta: Option[HostMemoryEmptyMetaData],
-    allPartValues: Array[(Long, InternalRow)],
-    toCombine: Array[HostMemoryBuffersWithMetaDataBase])
+  private class CombinedMeta(
+    val combinedEmptyMeta: Option[HostMemoryEmptyMetaData],
+    val allPartValues: Array[(Long, InternalRow)],
+    val toCombine: Array[HostMemoryBuffersWithMetaDataBase])
 
   /**
    * The sub-class must implement the real file reading logic in a Callable
@@ -2255,7 +2259,9 @@ class MultiFileCloudOrcPartitionReader(
           buffer.partitionedFile, buffer.allPartValues)
         if (memBuffersAndSize.length > 1) {
           val updatedBuffers = memBuffersAndSize.drop(1)
-          currentFileHostBuffers = Some(buffer.copy(memBuffersAndSizes = updatedBuffers))
+          currentFileHostBuffers = Some(new HostMemoryBuffersWithMetaData(
+            buffer.partitionedFile, updatedBuffers, buffer.bytesRead, buffer.updatedReadSchema,
+            buffer.compressionKind, buffer.requestedMapping, buffer.allPartValues))
         } else {
           currentFileHostBuffers = None
         }
@@ -2399,9 +2405,10 @@ class MultiFileCloudOrcPartitionReader(
             SpillPriorities.ACTIVE_BATCHING_PRIORITY)
           val combinedRet = SingleHMBAndMeta(Array(finalBuf), outStream.getPos, numRows,
             blockMetas)
-          val newHmbWithMeta = metaToUse.copy(
-            memBuffersAndSizes = Array(combinedRet),
-            allPartValues = Some(combinedMeta.allPartValues))
+          val newHmbWithMeta = new HostMemoryBuffersWithMetaData(
+            metaToUse.partitionedFile, Array(combinedRet), metaToUse.bytesRead,
+            metaToUse.updatedReadSchema, metaToUse.compressionKind, metaToUse.requestedMapping,
+            Some(combinedMeta.allPartValues))
           val filterTime = combinedMeta.toCombine.map(_.getFilterTime).sum
           val bufferTime = combinedMeta.toCombine.map(_.getBufferTime).sum
           newHmbWithMeta.setExecutionTime(filterTime, bufferTime)
@@ -2488,7 +2495,7 @@ class MultiFileCloudOrcPartitionReader(
 
     val combinedEmptyMeta = if (allEmpty) {
       // metaForEmpty should not be null here
-      Some(HostMemoryEmptyMetaData(
+      Some(new HostMemoryEmptyMetaData(
         metaForEmpty.partitionedFile, // not used, so pick one
         emptyNumRows, emptyTotalBytesRead,
         metaForEmpty.readSchema,
@@ -2496,7 +2503,7 @@ class MultiFileCloudOrcPartitionReader(
     } else {
       None
     }
-    CombinedMeta(combinedEmptyMeta, allPartValues.toArray, toCombine.toArray)
+    new CombinedMeta(combinedEmptyMeta, allPartValues.toArray, toCombine.toArray)
   }
 }
 
@@ -2536,13 +2543,13 @@ trait OrcCodecWritingHelper {
 }
 
 // Orc schema wrapper
-private case class OrcSchemaWrapper(schema: TypeDescription) extends SchemaBase {
+private class OrcSchemaWrapper(val schema: TypeDescription) extends SchemaBase with Serializable {
 
   override def isEmpty: Boolean = schema.getFieldNames.isEmpty
 }
 
-case class OrcStripeWithMeta(stripe: OrcOutputStripe, ctx: OrcPartitionReaderContext)
-    extends OrcCodecWritingHelper {
+class OrcStripeWithMeta(val stripe: OrcOutputStripe, val ctx: OrcPartitionReaderContext)
+    extends OrcCodecWritingHelper with Serializable {
 
   lazy val stripeLength: Long = {
     // calculate the true stripe footer size
@@ -2557,7 +2564,8 @@ case class OrcStripeWithMeta(stripe: OrcOutputStripe, ctx: OrcPartitionReaderCon
 }
 
 // OrcOutputStripe wrapper
-private[rapids] case class OrcDataStripe(stripeMeta: OrcStripeWithMeta) extends DataBlockBase {
+private[rapids] class OrcDataStripe(val stripeMeta: OrcStripeWithMeta)
+    extends DataBlockBase with Serializable {
 
   override def getRowCount: Long = stripeMeta.stripe.infoBuilder.getNumberOfRows
 
@@ -2568,17 +2576,17 @@ private[rapids] case class OrcDataStripe(stripeMeta: OrcStripeWithMeta) extends
 }
 
 /** Orc extra information containing the requested column ids for the current coalescing stripes */
-case class OrcExtraInfo(requestedMapping: Option[Array[Int]]) extends ExtraInfo
+class OrcExtraInfo(val requestedMapping: Option[Array[Int]]) extends ExtraInfo with Serializable
 
 // Contains meta about a single stripe of an ORC file
-private case class OrcSingleStripeMeta(
-  filePath: Path, // Orc file path
-  dataBlock: OrcDataStripe, // Orc stripe information with the OrcPartitionReaderContext
-  partitionValues: InternalRow, // partitioned values
-  schema: OrcSchemaWrapper, // Orc schema
-  readSchema: StructType, // Orc read schema
-  extraInfo: OrcExtraInfo // Orc ExtraInfo containing the requested column ids
-) extends SingleDataBlockInfo
+private class OrcSingleStripeMeta(
+  val filePath: Path, // Orc file path
+  val dataBlock: OrcDataStripe, // Orc stripe information with the OrcPartitionReaderContext
+  val partitionValues: InternalRow, // partitioned values
+  val schema: OrcSchemaWrapper, // Orc schema
+  val readSchema: StructType, // Orc read schema
+  val extraInfo: OrcExtraInfo // Orc ExtraInfo containing the requested column ids
+) extends SingleDataBlockInfo with Serializable
 
 /**
  *
@@ -2840,7 +2848,15 @@ class MultiFileOrcPartitionReader(
   }
 }
 
-object MakeOrcTableProducer extends Logging {
+object MakeOrcTableProducer {
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+
+  private def logWarning(msg: => String): Unit = {
+    if (log.isWarnEnabled) {
+      log.warn(msg)
+    }
+  }
+
   def apply(
       useChunkedReader: Boolean,
       maxChunkedReaderMemoryUsageSizeBytes: Long,
@@ -2865,7 +2881,7 @@ object MakeOrcTableProducer extends Logging {
       }
     }
     if (useChunkedReader) {
-      OrcTableReader(conf, chunkSizeByteLimit, maxChunkedReaderMemoryUsageSizeBytes,
+      new OrcTableReader(conf, chunkSizeByteLimit, maxChunkedReaderMemoryUsageSizeBytes,
         parseOpts, buffer, offset, bufferSize, metrics,  isSchemaCaseSensitive, readDataSchema,
         tableSchema, splits, debugDumpPrefix, debugDumpAlways)
     } else {
@@ -2905,7 +2921,7 @@ object MakeOrcTableProducer extends Logging {
   }
 }
 
-case class OrcTableReader(
+class OrcTableReader(
     conf: Configuration,
     chunkSizeByteLimit: Long,
     maxChunkedReaderMemoryUsageSizeBytes: Long,
@@ -2919,7 +2935,7 @@ case class OrcTableReader(
     tableSchema: TypeDescription,
     splits: Array[PartitionedFile],
     debugDumpPrefix: Option[String],
-    debugDumpAlways: Boolean) extends GpuDataProducer[Table] with Logging {
+    debugDumpAlways: Boolean) extends GpuDataProducer[Table] with RapidsLocalLog with Serializable {
 
   private[this] val reader = new ORCChunkedReader(chunkSizeByteLimit,
     maxChunkedReaderMemoryUsageSizeBytes, parseOpts, buffer, offset, bufferSize)
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuOrcTimezoneUtils.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuOrcTimezoneUtils.scala
deleted file mode 100644
index 9ef9d5f6ebb..00000000000
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuOrcTimezoneUtils.scala
+++ /dev/null
@@ -1,151 +0,0 @@
-/*
- * Copyright (c) 2025, NVIDIA CORPORATION.
- *
- * Licensed under the Apache License, Version 2.0 (the "License");
- * you may not use this file except in compliance with the License.
- * You may obtain a copy of the License at
- *
- *     http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-
-package com.nvidia.spark.rapids
-
-import ai.rapids.cudf.{ColumnView, DType, Scalar, Table}
-import com.nvidia.spark.rapids.Arm.withResource
-import com.nvidia.spark.rapids.RapidsPluginImplicits.AutoCloseableProducingSeq
-import java.time.{LocalDateTime, ZoneId}
-import java.util.Optional
-import scala.collection.mutable.ArrayBuffer
-
-object GpuOrcTimezoneUtils {
-
-  /**
-   * Get the offset in microseconds for 2025-01-01 between JVM timezone and UTC timezone.
-   * @param jvmTz the JVM timezone to calculate the offset for
-   * @return the offset in microseconds
-   *         between the JVM timezone and UTC timezone for 2025-01-01
-   *         This is used to rebase the timestamp columns in the input table.
-   */
-  private def getOffsetForJanuaryFirst2015(jvmTz: ZoneId): Long = {
-    val t1 = LocalDateTime.of(2015, 1, 1, 0, 0, 0).atZone(jvmTz).toInstant.getEpochSecond
-    val t2 = LocalDateTime.of(2015, 1, 1, 0, 0, 0).atZone(ZoneId.of("UTC")).toInstant.getEpochSecond
-    val diffMicros: Long = (t2 - t1) * 1000000L // convert seconds to microseconds
-    diffMicros
-  }
-
-  /**
-   * Recursively rebase the timestamp columns in the input column view to the target timezone.
-   * It handles nested types: list and struct.
-   * The rebase logic is simple: just subtract the offset in microseconds between the
-   * target timezone and UTC timezone.
-   * For more details about the rebase logic, please refer to:
-   * https://github.com/apache/orc/blob/rel/release-1.9.1/
-   * java/core/src/java/org/apache/orc/impl/TreeReaderFactory.java#L1157
-   * `TimestampTreeReader.getBaseTimestamp` generates the base timestamp with JVM default timezone.
-   * `threadLocalDateFormat.get().setTimeZone(writerTimeZone);`
-   * The above writerTimeZone is not the timezone in the ORC file stripe footer,
-   * it is the default JVM timezone.
-   * `TimestampTreeReader.readTimestamp` applies the diff:
-   *   `long millis = (data.next() + base_timestamp)`
-   * Note: the input timestamp columns are read as in the UTC timezone.
-   *
-   */
-  private def rebaseTimestampRecursively(
-                                          col: ColumnView,
-                                          toZoneId: ZoneId,
-                                          toClose: ArrayBuffer[ColumnView],
-                                          diffMicros: Long): ColumnView = {
-
-    // Util function to add a view to the buffer "toClose".
-    val addToClose = (v: ColumnView) => {
-      toClose += v
-      v
-    }
-
-    val dType = col.getType
-    if (dType.hasTimeResolution) {
-      assert(dType == DType.TIMESTAMP_MICROSECONDS,
-        s"Only TIMESTAMP_MICROSECONDS is supported, but got $dType")
-
-      // 1. timestamp type, rebase timestamp column
-      withResource(col.bitCastTo(DType.INT64)) { longs =>
-        withResource(Scalar.fromLong(diffMicros)) { offsetScalar =>
-          withResource(longs.sub(offsetScalar)) { rebased =>
-            rebased.castTo(DType.TIMESTAMP_MICROSECONDS)
-          }
-        }
-      }
-    } else if (dType == DType.LIST) {
-      // 2. nest list type
-      val child = addToClose(col.getChildColumnView(0))
-      val newChild = rebaseTimestampRecursively(child, toZoneId, toClose, diffMicros)
-      if (newChild != child) {
-        col.replaceListChild(addToClose(newChild))
-      } else {
-        col
-      }
-    } else if (dType == DType.STRUCT) {
-      // 3. nest struct type
-      val newViews = (0 until col.getNumChildren).safeMap { i =>
-        val child = addToClose(col.getChildColumnView(i))
-        val newChild = rebaseTimestampRecursively(child, toZoneId, toClose, diffMicros)
-        if (newChild != child) {
-          addToClose(newChild)
-        }
-        newChild
-      }
-      val opNullCount = Optional.of(col.getNullCount.asInstanceOf[java.lang.Long])
-      new ColumnView(col.getType, col.getRowCount, opNullCount, col.getValid,
-        col.getOffsets, newViews.toArray)
-    } else {
-      // 4. other types, no need to rebase
-      col
-    }
-  }
-
-  /**
-   * Rebase the timestamp columns in the input table to the system default timezone.
-   * If the system's default timezone is UTC, it returns the input table as it is.
-   *
-   * @param input the input table, it will be closed after returning
-   * @return a new table with rebased timestamp columns
-   */
-  def rebaseTimeZone(input: Table): Table = {
-    val toZoneId = ZoneId.systemDefault()
-
-    if (toZoneId == ZoneId.of("UTC")) {
-      // UTC timezone, no need to rebase
-      return input
-    }
-
-    // get the offset in microseconds for 2015-01-01 between JVM timezone and UTC timezone
-    val diffMicros = getOffsetForJanuaryFirst2015(toZoneId)
-
-    withResource(input) { _ =>
-      val newColumns = (0 until input.getNumberOfColumns).safeMap { colIdx =>
-        val col = input.getColumn(colIdx)
-        withResource(new ArrayBuffer[ColumnView]) { toClose =>
-          val rebased = rebaseTimestampRecursively(col, toZoneId, toClose, diffMicros)
-          if (col == rebased) {
-            // no change
-            col.incRefCount()
-          } else {
-            // rebased, copy the new column
-            toClose += rebased
-            rebased.copyToColumnVector()
-          }
-        }
-      }
-
-      withResource(newColumns) { _ =>
-        new Table(newColumns: _*)
-      }
-    }
-  }
-}
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuOverrides.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuOverrides.scala
index f82d903fc8a..086db5183cf 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuOverrides.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuOverrides.scala
@@ -30,7 +30,6 @@ import com.nvidia.spark.rapids.shims._
 import com.nvidia.spark.rapids.window.{GpuDenseRank, GpuLag, GpuLead, GpuPercentRank, GpuRank, GpuRowNumber, GpuSpecialFrameBoundary, GpuWindowExecMeta, GpuWindowSpecDefinitionMeta}
 import org.apache.hadoop.fs.Path
 
-import org.apache.spark.internal.Logging
 import org.apache.spark.rapids.hybrid.HybridExecutionUtils
 import org.apache.spark.sql.{DataFrame, SparkSession}
 import org.apache.spark.sql.catalyst.expressions._
@@ -457,7 +456,157 @@ object WriteFileOp extends FileFormatOp {
   override def toString = "write"
 }
 
-object GpuOverrides extends Logging {
+object GpuOverrides {
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+
+  private def logInfo(msg: => String): Unit = {
+    if (log.isInfoEnabled) {
+      log.info(msg)
+    }
+  }
+
+  private def logWarning(msg: => String): Unit = {
+    if (log.isWarnEnabled) log.warn(msg) // guard keeps the by-name message lazy when WARN is off
+  }
+
+  private def confValueToString(value: Any): String = value.toString
+
+  private def dataTypeExistsRecursively(
+      dataType: DataType,
+      f: DataType => Boolean): Boolean = {
+    f(dataType) || (dataType match {
+      case ArrayType(elementType, _) =>
+        dataTypeExistsRecursively(elementType, f)
+      case MapType(keyType, valueType, _) =>
+        dataTypeExistsRecursively(keyType, f) || dataTypeExistsRecursively(valueType, f)
+      case StructType(fields) =>
+        fields.exists(field => dataTypeExistsRecursively(field.dataType, f))
+      case _ => false
+    })
+  }
+
+  // Keep version-specific shim rule registries out of this object's constant pool.
+  private def shimSingleton(name: String): AnyRef = {
+    Class.forName("com.nvidia.spark.rapids.shims." + name + "$")
+      .getField("MODULE" + "$")
+      .get(null)
+      .asInstanceOf[AnyRef]
+  }
+
+  private def invokeShimSingleton(name: String, method: String): Any = {
+    val module = shimSingleton(name)
+    module.getClass.getMethod(method).invoke(module)
+  }
+
+  private def shimExprs(
+      name: String): Map[Class[_ <: Expression], ExprRule[_ <: Expression]] = {
+    invokeShimSingleton(name, "exprs")
+      .asInstanceOf[Map[Class[_ <: Expression], ExprRule[_ <: Expression]]]
+  }
+
+  private def shimExprRules(
+      name: String,
+      method: String): Map[Class[_ <: Expression], ExprRule[_ <: Expression]] = {
+    invokeShimSingleton(name, method)
+      .asInstanceOf[Map[Class[_ <: Expression], ExprRule[_ <: Expression]]]
+  }
+
+  private def shimExprRule(name: String, method: String): ExprRule[_ <: Expression] = {
+    invokeShimSingleton(name, method).asInstanceOf[ExprRule[_ <: Expression]]
+  }
+
+  private def shimScanRules(
+      name: String,
+      method: String): Map[Class[_ <: Scan], ScanRule[_ <: Scan]] = {
+    invokeShimSingleton(name, method)
+      .asInstanceOf[Map[Class[_ <: Scan], ScanRule[_ <: Scan]]]
+  }
+
+  private def shimPartRules(
+      name: String,
+      method: String): Map[Class[_ <: Partitioning], PartRule[_ <: Partitioning]] = {
+    invokeShimSingleton(name, method)
+      .asInstanceOf[Map[Class[_ <: Partitioning], PartRule[_ <: Partitioning]]]
+  }
+
+  private def shimDataWriteCmdRules(
+      name: String,
+      method: String): Map[Class[_ <: DataWritingCommand],
+      DataWritingCommandRule[_ <: DataWritingCommand]] = {
+    invokeShimSingleton(name, method)
+      .asInstanceOf[Map[Class[_ <: DataWritingCommand],
+        DataWritingCommandRule[_ <: DataWritingCommand]]]
+  }
+
+  private def shimRunnableCmdRules(
+      name: String,
+      method: String): Map[Class[_ <: RunnableCommand],
+      RunnableCommandRule[_ <: RunnableCommand]] = {
+    invokeShimSingleton(name, method)
+      .asInstanceOf[Map[Class[_ <: RunnableCommand],
+        RunnableCommandRule[_ <: RunnableCommand]]]
+  }
+
+  private def shimExecRules(
+      name: String,
+      method: String): Map[Class[_ <: SparkPlan], ExecRule[_ <: SparkPlan]] = {
+    invokeShimSingleton(name, method)
+      .asInstanceOf[Map[Class[_ <: SparkPlan], ExecRule[_ <: SparkPlan]]]
+  }
+
+  private def shimExecRule(name: String, method: String): ExecRule[_ <: SparkPlan] = {
+    invokeShimSingleton(name, method).asInstanceOf[ExecRule[_ <: SparkPlan]]
+  }
+
+  private def optionalShimExecRule(name: String, method: String): ExecRule[_ <: SparkPlan] = {
+    invokeShimSingleton(name, method)
+      .asInstanceOf[Option[ExecRule[_ <: SparkPlan]]]
+      .orNull
+  }
+
+  @transient private[this] lazy val aggregateInPandasExecShimsModule = {
+    Class.forName("com.nvidia.spark.rapids.shims.AggregateInPandasExecShims" + "$")
+      .getField("MODULE" + "$")
+      .get(null)
+  }
+
+  @transient private[this] lazy val aggregateInPandasExecRuleMethod =
+    aggregateInPandasExecShimsModule.getClass.getMethod("execRule")
+
+  private def aggregateInPandasExecRule: ExecRule[_ <: SparkPlan] = {
+    aggregateInPandasExecRuleMethod.invoke(aggregateInPandasExecShimsModule)
+      .asInstanceOf[Option[ExecRule[_ <: SparkPlan]]]
+      .orNull
+  }
+
+  @transient private[this] lazy val batchScanExecMetaConstructor =
+    Class.forName("com.nvidia.spark.rapids.shims.BatchScanExecMeta")
+      .getConstructor(classOf[BatchScanExec], classOf[RapidsConf],
+        classOf[Option[_]], classOf[DataFromReplacementRule])
+
+  private def newBatchScanExecMeta(
+      p: BatchScanExec, conf: RapidsConf, parent: Option[RapidsMeta[_, _, _]],
+      rule: DataFromReplacementRule): SparkPlanMeta[BatchScanExec] = try {
+    batchScanExecMetaConstructor.newInstance(p, conf, parent, rule)
+      .asInstanceOf[SparkPlanMeta[BatchScanExec]]
+  } catch { // rethrow the constructor's own failure instead of the reflection wrapper
+    case e: java.lang.reflect.InvocationTargetException if e.getCause != null => throw e.getCause
+  }
+
+  @transient private[this] lazy val gpuSubqueryBroadcastMetaConstructor =
+    Class.forName("org.apache.spark.sql.rapids.execution.GpuSubqueryBroadcastMeta")
+      .getConstructor(classOf[SubqueryBroadcastExec], classOf[RapidsConf],
+        classOf[Option[_]], classOf[DataFromReplacementRule])
+
+  private def newGpuSubqueryBroadcastMeta(
+      plan: SubqueryBroadcastExec, conf: RapidsConf, parent: Option[RapidsMeta[_, _, _]],
+      rule: DataFromReplacementRule): SparkPlanMeta[SubqueryBroadcastExec] = try {
+    gpuSubqueryBroadcastMetaConstructor.newInstance(plan, conf, parent, rule)
+      .asInstanceOf[SparkPlanMeta[SubqueryBroadcastExec]]
+  } catch { // rethrow the constructor's own failure instead of the reflection wrapper
+    case e: java.lang.reflect.InvocationTargetException if e.getCause != null => throw e.getCause
+  }
+
   val FLOAT_DIFFERS_GROUP_INCOMPAT =
     "when enabling these, there may be extra groups produced for floating point grouping " +
     "keys (e.g. -0.0, and 0.0)"
@@ -718,13 +867,13 @@ object GpuOverrides extends Logging {
     expressions.exists(isStringLit)
 
   def isOrContainsFloatingPoint(dataType: DataType): Boolean =
-    TrampolineUtil.dataTypeExistsRecursively(dataType, dt => dt == FloatType || dt == DoubleType)
+    dataTypeExistsRecursively(dataType, { case FloatType | DoubleType => true; case _ => false })
 
   def isOrContainsDateOrTimestamp(dataType: DataType): Boolean =
-    TrampolineUtil.dataTypeExistsRecursively(dataType, dt => dt == TimestampType || dt == DateType)
+    dataTypeExistsRecursively(dataType, { case TimestampType | DateType => true; case _ => false })
 
   def isOrContainsTimestamp(dataType: DataType): Boolean =
-    TrampolineUtil.dataTypeExistsRecursively(dataType, dt => dt == TimestampType)
+    dataTypeExistsRecursively(dataType, _ == TimestampType)
 
   /** Tries to predict whether an adaptive plan will end up with data on the GPU or not. */
   def probablyGpuPlan(adaptivePlan: AdaptiveSparkPlanExec, conf: RapidsConf): Boolean = {
@@ -849,6 +998,15 @@ object GpuOverrides extends Logging {
     new ExecRule[INPUT](doWrap, desc, Some(pluginChecks), tag)
   }
 
+  /** Delegates to `exec`, taking the description and tag from the non-null shim `rule`. */
+  def execFromShim[INPUT <: SparkPlan](rule: ShimExecRule[INPUT], pluginChecks: ExecChecks,
+      doWrap: (INPUT, RapidsConf, Option[RapidsMeta[_, _, _]], DataFromReplacementRule)
+          => SparkPlanMeta[INPUT]): ExecRule[INPUT] = {
+    assert(rule != null)
+    val description = rule.desc
+    exec(description, pluginChecks, doWrap)(rule.tag)
+  }
+
   def dataWriteCmd[INPUT <: DataWritingCommand](
       desc: String,
       doWrap: (INPUT, RapidsConf, Option[RapidsMeta[_, _, _]], DataFromReplacementRule)
@@ -859,6 +1017,14 @@ object GpuOverrides extends Logging {
     new DataWritingCommandRule[INPUT](doWrap, desc, tag)
   }
 
+  /** Delegates to `dataWriteCmd`, taking the description and tag from the shim `rule`. */
+  def dataWriteCmdFromShim[INPUT <: DataWritingCommand](rule: ShimDataWritingCommandRule[INPUT],
+      doWrap: (INPUT, RapidsConf, Option[RapidsMeta[_, _, _]], DataFromReplacementRule)
+          => DataWritingCommandMeta[INPUT]): DataWritingCommandRule[INPUT] = {
+    assert(rule != null)
+    dataWriteCmd(rule.desc, doWrap)(rule.tag)
+  }
+
   def wrapExpr[INPUT <: Expression](
       expr: INPUT,
       conf: RapidsConf,
@@ -1025,8 +1191,8 @@ object GpuOverrides extends Logging {
       ExprChecks.windowOnly(
         TypeSig.all,
         TypeSig.all,
-        Seq(ParamCheck("windowFunction", TypeSig.all, TypeSig.all),
-          ParamCheck("windowSpec",
+        Seq(new ParamCheck("windowFunction", TypeSig.all, TypeSig.all),
+          new ParamCheck("windowSpec",
             TypeSig.CALENDAR + TypeSig.NULL + TypeSig.integral + TypeSig.DECIMAL_64,
             TypeSig.numericAndInterval))),
       (windowExpression, conf, p, r) => new GpuWindowExpressionMeta(windowExpression, conf, p, r)),
@@ -1037,11 +1203,11 @@ object GpuOverrides extends Logging {
         TypeSig.CALENDAR + TypeSig.NULL + TypeSig.integral,
         TypeSig.numericAndInterval,
         Seq(
-          ParamCheck("lower",
+          new ParamCheck("lower",
             TypeSig.CALENDAR + TypeSig.NULL + TypeSig.integral + TypeSig.DECIMAL_128 +
               TypeSig.FLOAT + TypeSig.DOUBLE,
             TypeSig.numericAndInterval),
-          ParamCheck("upper",
+          new ParamCheck("upper",
             TypeSig.CALENDAR + TypeSig.NULL + TypeSig.integral + TypeSig.DECIMAL_128 +
               TypeSig.FLOAT + TypeSig.DOUBLE,
             TypeSig.numericAndInterval))),
@@ -1077,7 +1243,7 @@ object GpuOverrides extends Logging {
       "Window function that returns the index for the row within the aggregation window",
       ExprChecks.windowOnly(TypeSig.INT, TypeSig.INT,
         repeatingParamCheck =
-          Some(RepeatingParamCheck("ordering",
+          Some(new RepeatingParamCheck("ordering",
             TypeSig.commonCudfTypes + TypeSig.DECIMAL_128 + TypeSig.NULL,
             TypeSig.all))),
       (rowNumber, conf, p, r) => new ExprMeta[RowNumber](rowNumber, conf, p, r) {
@@ -1087,7 +1253,7 @@ object GpuOverrides extends Logging {
       "Window function that returns the rank value within the aggregation window",
       ExprChecks.windowOnly(TypeSig.INT, TypeSig.INT,
         repeatingParamCheck =
-          Some(RepeatingParamCheck("ordering",
+          Some(new RepeatingParamCheck("ordering",
             TypeSig.commonCudfTypes + TypeSig.DECIMAL_128 + TypeSig.NULL,
             TypeSig.all))),
       (rank, conf, p, r) => new ExprMeta[Rank](rank, conf, p, r) {
@@ -1097,7 +1263,7 @@ object GpuOverrides extends Logging {
       "Window function that returns the dense rank value within the aggregation window",
       ExprChecks.windowOnly(TypeSig.INT, TypeSig.INT,
         repeatingParamCheck =
-          Some(RepeatingParamCheck("ordering",
+          Some(new RepeatingParamCheck("ordering",
             TypeSig.commonCudfTypes + TypeSig.DECIMAL_128 + TypeSig.NULL,
             TypeSig.all))),
       (denseRank, conf, p, r) => new ExprMeta[DenseRank](denseRank, conf, p, r) {
@@ -1108,7 +1274,7 @@ object GpuOverrides extends Logging {
       "Window function that returns the percent rank value within the aggregation window",
       ExprChecks.windowOnly(TypeSig.DOUBLE, TypeSig.DOUBLE,
         repeatingParamCheck =
-          Some(RepeatingParamCheck("ordering",
+          Some(new RepeatingParamCheck("ordering",
             TypeSig.commonCudfTypes + TypeSig.DECIMAL_128 + TypeSig.NULL,
             TypeSig.all))),
       (percentRank, conf, p, r) => new ExprMeta[PercentRank](percentRank, conf, p, r) {
@@ -1122,12 +1288,12 @@ object GpuOverrides extends Logging {
           TypeSig.ARRAY + TypeSig.STRUCT).nested(),
         TypeSig.all,
         Seq(
-          ParamCheck("input",
+          new ParamCheck("input",
             (TypeSig.commonCudfTypes + TypeSig.DECIMAL_128 +
               TypeSig.NULL + TypeSig.ARRAY + TypeSig.STRUCT).nested(),
             TypeSig.all),
-          ParamCheck("offset", TypeSig.INT, TypeSig.INT),
-          ParamCheck("default",
+          new ParamCheck("offset", TypeSig.INT, TypeSig.INT),
+          new ParamCheck("default",
             (TypeSig.commonCudfTypes + TypeSig.DECIMAL_128 + TypeSig.NULL +
               TypeSig.ARRAY + TypeSig.STRUCT).nested(),
             TypeSig.all)
@@ -1144,12 +1310,12 @@ object GpuOverrides extends Logging {
           TypeSig.ARRAY + TypeSig.STRUCT).nested(),
         TypeSig.all,
         Seq(
-          ParamCheck("input",
+          new ParamCheck("input",
             (TypeSig.commonCudfTypes + TypeSig.DECIMAL_128 +
               TypeSig.NULL + TypeSig.ARRAY + TypeSig.STRUCT).nested(),
             TypeSig.all),
-          ParamCheck("offset", TypeSig.INT, TypeSig.INT),
-          ParamCheck("default",
+          new ParamCheck("offset", TypeSig.INT, TypeSig.INT),
+          new ParamCheck("default",
             (TypeSig.commonCudfTypes + TypeSig.DECIMAL_128 + TypeSig.NULL +
               TypeSig.ARRAY + TypeSig.STRUCT).nested(),
             TypeSig.all)
@@ -1409,7 +1575,7 @@ object GpuOverrides extends Logging {
     expr[AtLeastNNonNulls](
       "Checks if number of non null/Nan values is greater than a given value",
       ExprChecks.projectOnly(TypeSig.BOOLEAN, TypeSig.BOOLEAN,
-        repeatingParamCheck = Some(RepeatingParamCheck("input",
+        repeatingParamCheck = Some(new RepeatingParamCheck("input",
           (TypeSig.commonCudfTypes + TypeSig.NULL + TypeSig.DECIMAL_128 + TypeSig.BINARY +
               TypeSig.MAP + TypeSig.ARRAY + TypeSig.STRUCT).nested(),
           TypeSig.all))),
@@ -1524,7 +1690,7 @@ object GpuOverrides extends Logging {
       "Returns the bitwise AND of all non-null input values",
       ExprChecks.reductionAndGroupByAgg(
         TypeSig.integral, TypeSig.integral,
-        Seq(ParamCheck("input", TypeSig.integral, TypeSig.integral))),
+        Seq(new ParamCheck("input", TypeSig.integral, TypeSig.integral))),
       (a, conf, p, r) => new AggExprMeta[BitAndAgg](a, conf, p, r) {
         override def convertToGpu(childExprs: Seq[Expression]): GpuExpression =
           GpuBitAndAgg(childExprs.head)
@@ -1535,7 +1701,7 @@ object GpuOverrides extends Logging {
       "Returns the bitwise OR of all non-null input values",
       ExprChecks.reductionAndGroupByAgg(
         TypeSig.integral, TypeSig.integral,
-        Seq(ParamCheck("input", TypeSig.integral, TypeSig.integral))),
+        Seq(new ParamCheck("input", TypeSig.integral, TypeSig.integral))),
       (a, conf, p, r) => new AggExprMeta[BitOrAgg](a, conf, p, r) {
         override def convertToGpu(childExprs: Seq[Expression]): GpuExpression =
           GpuBitOrAgg(childExprs.head)
@@ -1546,7 +1712,7 @@ object GpuOverrides extends Logging {
       "Returns the bitwise XOR of all non-null input values",
       ExprChecks.reductionAndGroupByAgg(
         TypeSig.integral, TypeSig.integral,
-        Seq(ParamCheck("input", TypeSig.integral, TypeSig.integral))),
+        Seq(new ParamCheck("input", TypeSig.integral, TypeSig.integral))),
       (a, conf, p, r) => new AggExprMeta[BitXorAgg](a, conf, p, r) {
         override def convertToGpu(childExprs: Seq[Expression]): GpuExpression =
           GpuBitXorAgg(childExprs.head)
@@ -1559,7 +1725,7 @@ object GpuOverrides extends Logging {
         (gpuCommonTypes + TypeSig.ARRAY + TypeSig.STRUCT + TypeSig.BINARY +
           TypeSig.MAP + GpuTypeShims.additionalArithmeticSupportedTypes).nested(),
         TypeSig.all,
-        repeatingParamCheck = Some(RepeatingParamCheck("param",
+        repeatingParamCheck = Some(new RepeatingParamCheck("param",
           (gpuCommonTypes + TypeSig.ARRAY + TypeSig.STRUCT + TypeSig.BINARY +
             TypeSig.MAP + GpuTypeShims.additionalArithmeticSupportedTypes).nested(),
           TypeSig.all))),
@@ -1571,7 +1737,7 @@ object GpuOverrides extends Logging {
       "Returns the least value of all parameters, skipping null values",
       ExprChecks.projectOnly(
         TypeSig.commonCudfTypes + TypeSig.NULL + TypeSig.DECIMAL_128, TypeSig.orderable,
-        repeatingParamCheck = Some(RepeatingParamCheck("param",
+        repeatingParamCheck = Some(new RepeatingParamCheck("param",
           TypeSig.commonCudfTypes + TypeSig.NULL + TypeSig.DECIMAL_128,
           TypeSig.orderable))),
       (a, conf, p, r) => new ExprMeta[Least](a, conf, p, r) {
@@ -1581,7 +1747,7 @@ object GpuOverrides extends Logging {
       "Returns the greatest value of all parameters, skipping null values",
       ExprChecks.projectOnly(
         TypeSig.commonCudfTypes + TypeSig.NULL + TypeSig.DECIMAL_128, TypeSig.orderable,
-        repeatingParamCheck = Some(RepeatingParamCheck("param",
+        repeatingParamCheck = Some(new RepeatingParamCheck("param",
           TypeSig.commonCudfTypes + TypeSig.NULL + TypeSig.DECIMAL_128,
           TypeSig.orderable))),
       (a, conf, p, r) => new ExprMeta[Greatest](a, conf, p, r) {
@@ -1885,9 +2051,9 @@ object GpuOverrides extends Logging {
         "are the last day of month, time of day will be ignored. Otherwise, the difference is " +
         "calculated based on 31 days per month, and rounded to 8 digits unless roundOff=false.",
       ExprChecks.projectOnly(TypeSig.DOUBLE, TypeSig.DOUBLE,
-        Seq(ParamCheck("timestamp1", TypeSig.TIMESTAMP, TypeSig.TIMESTAMP),
-          ParamCheck("timestamp2", TypeSig.TIMESTAMP, TypeSig.TIMESTAMP),
-          ParamCheck("round", TypeSig.lit(TypeEnum.BOOLEAN), TypeSig.BOOLEAN))),
+        Seq(new ParamCheck("timestamp1", TypeSig.TIMESTAMP, TypeSig.TIMESTAMP),
+          new ParamCheck("timestamp2", TypeSig.TIMESTAMP, TypeSig.TIMESTAMP),
+          new ParamCheck("round", TypeSig.lit(TypeEnum.BOOLEAN), TypeSig.BOOLEAN))),
       (a, conf, p, r) => new MonthsBetweenExprMeta(a, conf, p, r)
     ),
     expr[TruncDate](
@@ -2061,9 +2227,9 @@ object GpuOverrides extends Logging {
     expr[In](
       "IN operator",
       ExprChecks.projectOnly(TypeSig.BOOLEAN, TypeSig.BOOLEAN,
-        Seq(ParamCheck("value", TypeSig.commonCudfTypes + TypeSig.NULL + TypeSig.DECIMAL_128,
+        Seq(new ParamCheck("value", TypeSig.commonCudfTypes + TypeSig.NULL + TypeSig.DECIMAL_128,
           TypeSig.comparable)),
-        Some(RepeatingParamCheck("list",
+        Some(new RepeatingParamCheck("list",
           (TypeSig.commonCudfTypes + TypeSig.DECIMAL_128).withAllLit(),
           TypeSig.comparable))),
       (in, conf, p, r) => new ExprMeta[In](in, conf, p, r) {
@@ -2131,12 +2297,12 @@ object GpuOverrides extends Logging {
         (gpuCommonTypes + TypeSig.ARRAY + TypeSig.STRUCT + TypeSig.MAP +
             TypeSig.BINARY + GpuTypeShims.additionalCommonOperatorSupportedTypes).nested(),
         TypeSig.all,
-        Seq(ParamCheck("predicate", TypeSig.BOOLEAN, TypeSig.BOOLEAN),
-          ParamCheck("trueValue",
+        Seq(new ParamCheck("predicate", TypeSig.BOOLEAN, TypeSig.BOOLEAN),
+          new ParamCheck("trueValue",
             (gpuCommonTypes + TypeSig.ARRAY + TypeSig.STRUCT + TypeSig.MAP +
                 TypeSig.BINARY + GpuTypeShims.additionalCommonOperatorSupportedTypes).nested(),
             TypeSig.all),
-          ParamCheck("falseValue",
+          new ParamCheck("falseValue",
             (gpuCommonTypes + TypeSig.ARRAY + TypeSig.STRUCT + TypeSig.MAP +
                 TypeSig.BINARY + GpuTypeShims.additionalCommonOperatorSupportedTypes).nested(),
             TypeSig.all))),
@@ -2162,8 +2328,8 @@ object GpuOverrides extends Logging {
       ExprChecks.fullAgg(
         TypeSig.all,
         TypeSig.all,
-        Seq(ParamCheck("aggFunc", TypeSig.all, TypeSig.all)),
-        Some(RepeatingParamCheck("filter", TypeSig.BOOLEAN, TypeSig.BOOLEAN))),
+        Seq(new ParamCheck("aggFunc", TypeSig.all, TypeSig.all)),
+        Some(new RepeatingParamCheck("filter", TypeSig.BOOLEAN, TypeSig.BOOLEAN))),
       (a, conf, p, r) => new ExprMeta[AggregateExpression](a, conf, p, r) {
         private val filter: Option[BaseExprMeta[_]] =
           a.filter.map(GpuOverrides.wrapExpr(_, this.conf, Some(this)))
@@ -2193,23 +2359,23 @@ object GpuOverrides extends Logging {
         pluginSupportedOrderableSig + TypeSig.ARRAY.nested(gpuCommonTypes)
             .withPsNote(TypeEnum.ARRAY, "STRUCT is not supported as a child type for ARRAY"),
         TypeSig.orderable,
-        Seq(ParamCheck(
+        Seq(new ParamCheck(
           "input",
           pluginSupportedOrderableSig + TypeSig.ARRAY.nested(gpuCommonTypes)
              .withPsNote(TypeEnum.ARRAY, "STRUCT is not supported as a child type for ARRAY"),
           TypeSig.orderable))),
-      GpuSortOrderMeta),
+      (sortOrder, conf, p, r) => new GpuSortOrderMeta(sortOrder, conf, p, r)),
     expr[PivotFirst](
       "PivotFirst operator",
       ExprChecks.reductionAndGroupByAgg(
         TypeSig.commonCudfTypes + TypeSig.NULL + TypeSig.DECIMAL_128 +
           TypeSig.ARRAY.nested(TypeSig.commonCudfTypes + TypeSig.DECIMAL_128),
         TypeSig.all,
-        Seq(ParamCheck(
+        Seq(new ParamCheck(
           "pivotColumn",
           (TypeSig.commonCudfTypes + TypeSig.NULL + TypeSig.DECIMAL_128),
           TypeSig.all),
-          ParamCheck("valueColumn",
+          new ParamCheck("valueColumn",
           TypeSig.commonCudfTypes + TypeSig.NULL + TypeSig.DECIMAL_128,
           TypeSig.all))),
       (pivot, conf, p, r) => new ImperativeAggExprMeta[PivotFirst](pivot, conf, p, r) {
@@ -2232,7 +2398,7 @@ object GpuOverrides extends Logging {
       "Count aggregate operator",
       ExprChecks.fullAgg(
         TypeSig.LONG, TypeSig.LONG,
-        repeatingParamCheck = Some(RepeatingParamCheck(
+        repeatingParamCheck = Some(new RepeatingParamCheck(
           "input", TypeSig.all, TypeSig.all))),
       (count, conf, p, r) => new AggExprMeta[Count](count, conf, p, r) {
 
@@ -2249,12 +2415,12 @@ object GpuOverrides extends Logging {
       }),
     expr[Max](
       "Max aggregate operator",
-      ExprChecksImpl(
+      new ExprChecksImpl(
         ExprChecks.reductionAndGroupByAgg(
           (TypeSig.commonCudfTypes + TypeSig.DECIMAL_128 + TypeSig.NULL + TypeSig.STRUCT +
             TypeSig.ARRAY).nested(),
           TypeSig.orderable,
-          Seq(ParamCheck("input",
+          Seq(new ParamCheck("input",
             (TypeSig.commonCudfTypes + TypeSig.DECIMAL_128 + TypeSig.NULL + TypeSig.STRUCT +
               TypeSig.ARRAY).nested(),
             TypeSig.orderable))).asInstanceOf[ExprChecksImpl].contexts
@@ -2262,7 +2428,7 @@ object GpuOverrides extends Logging {
           ExprChecks.windowOnly(
             (TypeSig.commonCudfTypes + TypeSig.DECIMAL_128 + TypeSig.NULL),
             TypeSig.orderable,
-            Seq(ParamCheck("input",
+            Seq(new ParamCheck("input",
               (TypeSig.commonCudfTypes + TypeSig.DECIMAL_128 + TypeSig.NULL),
               TypeSig.orderable))).asInstanceOf[ExprChecksImpl].contexts),
       (max, conf, p, r) => new AggExprMeta[Max](max, conf, p, r) {
@@ -2274,12 +2440,12 @@ object GpuOverrides extends Logging {
       }),
     expr[Min](
       "Min aggregate operator",
-      ExprChecksImpl(
+      new ExprChecksImpl(
         ExprChecks.reductionAndGroupByAgg(
           (TypeSig.commonCudfTypes + TypeSig.DECIMAL_128 + TypeSig.NULL + TypeSig.STRUCT +
               TypeSig.ARRAY).nested(),
           TypeSig.orderable,
-          Seq(ParamCheck("input",
+          Seq(new ParamCheck("input",
             (TypeSig.commonCudfTypes + TypeSig.DECIMAL_128 + TypeSig.NULL + TypeSig.STRUCT +
               TypeSig.ARRAY).nested(),
             TypeSig.orderable))).asInstanceOf[ExprChecksImpl].contexts
@@ -2287,7 +2453,7 @@ object GpuOverrides extends Logging {
           ExprChecks.windowOnly(
             (TypeSig.commonCudfTypes + TypeSig.DECIMAL_128 + TypeSig.NULL),
             TypeSig.orderable,
-            Seq(ParamCheck("input",
+            Seq(new ParamCheck("input",
               (TypeSig.commonCudfTypes + TypeSig.DECIMAL_128 + TypeSig.NULL),
               TypeSig.orderable))).asInstanceOf[ExprChecksImpl].contexts),
       (a, conf, p, r) => new AggExprMeta[Min](a, conf, p, r) {
@@ -2302,7 +2468,7 @@ object GpuOverrides extends Logging {
       ExprChecks.fullAgg(
         TypeSig.LONG + TypeSig.DOUBLE + TypeSig.DECIMAL_128,
         TypeSig.LONG + TypeSig.DOUBLE + TypeSig.DECIMAL_128,
-        Seq(ParamCheck("input", TypeSig.gpuNumeric, TypeSig.cpuNumeric))),
+        Seq(new ParamCheck("input", TypeSig.gpuNumeric, TypeSig.cpuNumeric))),
       (a, conf, p, r) => new AggExprMeta[Sum](a, conf, p, r) {
         override def tagAggForGpu(): Unit = {
           val inputDataType = a.child.dataType
@@ -2325,11 +2491,11 @@ object GpuOverrides extends Logging {
         (TypeSig.STRUCT + TypeSig.ARRAY + TypeSig.MAP + TypeSig.BINARY +
             TypeSig.commonCudfTypes + TypeSig.NULL + TypeSig.DECIMAL_128).nested(),
         TypeSig.all,
-        Seq(ParamCheck("input",
+        Seq(new ParamCheck("input",
           (TypeSig.STRUCT + TypeSig.ARRAY + TypeSig.MAP + TypeSig.BINARY +
               TypeSig.commonCudfTypes + TypeSig.NULL + TypeSig.DECIMAL_128).nested(),
           TypeSig.all),
-          ParamCheck("offset", TypeSig.lit(TypeEnum.INT), TypeSig.lit(TypeEnum.INT)))
+          new ParamCheck("offset", TypeSig.lit(TypeEnum.INT), TypeSig.lit(TypeEnum.INT)))
       ),
       (a, conf, p, r) => new AggExprMeta[NthValue](a, conf, p, r) {
         override def convertToGpu(childExprs: Seq[Expression]): GpuExpression =
@@ -2344,7 +2510,7 @@ object GpuOverrides extends Logging {
         (TypeSig.STRUCT + TypeSig.ARRAY + TypeSig.MAP + TypeSig.BINARY +
             TypeSig.commonCudfTypes + TypeSig.NULL + TypeSig.DECIMAL_128).nested(),
         TypeSig.all,
-        Seq(ParamCheck("input",
+        Seq(new ParamCheck("input",
           (TypeSig.STRUCT + TypeSig.ARRAY + TypeSig.MAP + TypeSig.BINARY +
               TypeSig.commonCudfTypes + TypeSig.NULL + TypeSig.DECIMAL_128).nested(),
           TypeSig.all))
@@ -2362,7 +2528,7 @@ object GpuOverrides extends Logging {
         (TypeSig.STRUCT + TypeSig.ARRAY + TypeSig.MAP + TypeSig.BINARY +
             TypeSig.commonCudfTypes + TypeSig.NULL + TypeSig.DECIMAL_128).nested(),
         TypeSig.all,
-        Seq(ParamCheck("input",
+        Seq(new ParamCheck("input",
           (TypeSig.STRUCT + TypeSig.ARRAY + TypeSig.MAP + TypeSig.BINARY +
               TypeSig.commonCudfTypes + TypeSig.NULL + TypeSig.DECIMAL_128).nested(),
           TypeSig.all))
@@ -2383,10 +2549,10 @@ object GpuOverrides extends Logging {
           TypeSig.commonCudfTypes + TypeSig.NULL + TypeSig.DECIMAL_128).nested(),
         TypeSig.all,
         Seq(
-          ParamCheck("value", (TypeSig.STRUCT + TypeSig.ARRAY + TypeSig.MAP + TypeSig.BINARY
+          new ParamCheck("value", (TypeSig.STRUCT + TypeSig.ARRAY + TypeSig.MAP + TypeSig.BINARY
             + TypeSig.commonCudfTypes + TypeSig.NULL + TypeSig.DECIMAL_128).nested(),
             TypeSig.all),
-          ParamCheck("ordering", (TypeSig.commonCudfTypes - TypeSig.fp + TypeSig.DECIMAL_128 +
+          new ParamCheck("ordering", (TypeSig.commonCudfTypes - TypeSig.fp + TypeSig.DECIMAL_128 +
             TypeSig.NULL + TypeSig.STRUCT + TypeSig.ARRAY).nested(
               TypeSig.commonCudfTypes + TypeSig.DECIMAL_128 +
               TypeSig.NULL + TypeSig.STRUCT + TypeSig.ARRAY),
@@ -2412,10 +2578,10 @@ object GpuOverrides extends Logging {
           TypeSig.commonCudfTypes + TypeSig.NULL + TypeSig.DECIMAL_128).nested(),
         TypeSig.all,
         Seq(
-          ParamCheck("value", (TypeSig.STRUCT + TypeSig.ARRAY + TypeSig.MAP + TypeSig.BINARY
+          new ParamCheck("value", (TypeSig.STRUCT + TypeSig.ARRAY + TypeSig.MAP + TypeSig.BINARY
             + TypeSig.commonCudfTypes + TypeSig.NULL + TypeSig.DECIMAL_128).nested(),
             TypeSig.all),
-          ParamCheck("ordering", (TypeSig.commonCudfTypes - TypeSig.fp + TypeSig.DECIMAL_128 +
+          new ParamCheck("ordering", (TypeSig.commonCudfTypes - TypeSig.fp + TypeSig.DECIMAL_128 +
             TypeSig.NULL + TypeSig.STRUCT + TypeSig.ARRAY).nested(
               TypeSig.commonCudfTypes + TypeSig.DECIMAL_128 +
               TypeSig.NULL + TypeSig.STRUCT + TypeSig.ARRAY),
@@ -2483,7 +2649,7 @@ object GpuOverrides extends Logging {
         // plugin is also an union of all the types of Pandas UDF.
         (TypeSig.commonCudfTypes + TypeSig.ARRAY).nested() + TypeSig.STRUCT,
         TypeSig.unionOfPandasUdfOut,
-        repeatingParamCheck = Some(RepeatingParamCheck(
+        repeatingParamCheck = Some(new RepeatingParamCheck(
           "param",
           (TypeSig.commonCudfTypes + TypeSig.ARRAY + TypeSig.STRUCT).nested(),
           TypeSig.all))),
@@ -2501,7 +2667,7 @@ object GpuOverrides extends Logging {
     expr[Rand](
       "Generate a random column with i.i.d. uniformly distributed values in [0, 1)",
       ExprChecks.projectOnly(TypeSig.DOUBLE, TypeSig.DOUBLE,
-        Seq(ParamCheck("seed",
+        Seq(new ParamCheck("seed",
           (TypeSig.INT + TypeSig.LONG).withAllLit(),
           (TypeSig.INT + TypeSig.LONG).withAllLit()))),
       (a, conf, p, r) => new UnaryExprMeta[Rand](a, conf, p, r) {
@@ -2578,9 +2744,9 @@ object GpuOverrides extends Logging {
     expr[StringLPad](
       "Pad a string on the left",
       ExprChecks.projectOnly(TypeSig.STRING, TypeSig.STRING,
-        Seq(ParamCheck("str", TypeSig.STRING, TypeSig.STRING),
-          ParamCheck("len", TypeSig.lit(TypeEnum.INT), TypeSig.INT),
-          ParamCheck("pad", TypeSig.lit(TypeEnum.STRING), TypeSig.STRING))),
+        Seq(new ParamCheck("str", TypeSig.STRING, TypeSig.STRING),
+          new ParamCheck("len", TypeSig.lit(TypeEnum.INT), TypeSig.INT),
+          new ParamCheck("pad", TypeSig.lit(TypeEnum.STRING), TypeSig.STRING))),
       (in, conf, p, r) => new TernaryExprMeta[StringLPad](in, conf, p, r) {
         override def tagExprForGpu(): Unit = {
           extractLit(in.pad).foreach { padLit =>
@@ -2599,9 +2765,9 @@ object GpuOverrides extends Logging {
     expr[StringRPad](
       "Pad a string on the right",
       ExprChecks.projectOnly(TypeSig.STRING, TypeSig.STRING,
-        Seq(ParamCheck("str", TypeSig.STRING, TypeSig.STRING),
-          ParamCheck("len", TypeSig.lit(TypeEnum.INT), TypeSig.INT),
-          ParamCheck("pad", TypeSig.lit(TypeEnum.STRING), TypeSig.STRING))),
+        Seq(new ParamCheck("str", TypeSig.STRING, TypeSig.STRING),
+          new ParamCheck("len", TypeSig.lit(TypeEnum.INT), TypeSig.INT),
+          new ParamCheck("pad", TypeSig.lit(TypeEnum.STRING), TypeSig.STRING))),
       (in, conf, p, r) => new TernaryExprMeta[StringRPad](in, conf, p, r) {
         override def tagExprForGpu(): Unit = {
           extractLit(in.pad).foreach { padLit =>
@@ -2622,11 +2788,11 @@ object GpuOverrides extends Logging {
       // Java's split API produces different behaviors than cudf when splitting with empty pattern
       ExprChecks.projectOnly(TypeSig.ARRAY.nested(TypeSig.STRING),
         TypeSig.ARRAY.nested(TypeSig.STRING),
-        Seq(ParamCheck("str", TypeSig.STRING, TypeSig.STRING),
-          ParamCheck("regexp", TypeSig.lit(TypeEnum.STRING)
+        Seq(new ParamCheck("str", TypeSig.STRING, TypeSig.STRING),
+          new ParamCheck("regexp", TypeSig.lit(TypeEnum.STRING)
               .withPsNote(TypeEnum.STRING, "very limited subset of regex supported"),
             TypeSig.STRING),
-          ParamCheck("limit", TypeSig.lit(TypeEnum.INT), TypeSig.INT))),
+          new ParamCheck("limit", TypeSig.lit(TypeEnum.INT), TypeSig.INT))),
       (in, conf, p, r) => new GpuStringSplitMeta(in, conf, p, r)),
     expr[GetStructField](
       "Gets the named field of the struct",
@@ -2721,7 +2887,7 @@ object GpuOverrides extends Logging {
       (in, conf, p, r) => new UnaryExprMeta[MapFromEntries](in, conf, p, r) {
         override def tagExprForGpu(): Unit = {
           // Spark 4.1+ returns an enum value instead of String, so use toString first
-          SQLConf.get.getConf(SQLConf.MAP_KEY_DEDUP_POLICY).toString.toUpperCase match {
+          confValueToString(SQLConf.get.getConf(SQLConf.MAP_KEY_DEDUP_POLICY)).toUpperCase match {
             case "EXCEPTION" | "LAST_WIN" => // Good we can support this
             case other =>
               willNotWorkOnGpu(s"$other is not supported for config setting" +
@@ -2735,9 +2901,15 @@ object GpuOverrides extends Logging {
       "Creates a map after splitting the input string into pairs of key-value strings",
       // Java's split API produces different behaviors than cudf when splitting with empty pattern
       ExprChecks.projectOnly(TypeSig.MAP.nested(TypeSig.STRING), TypeSig.MAP.nested(TypeSig.STRING),
-        Seq(ParamCheck("str", TypeSig.STRING, TypeSig.STRING),
-          ParamCheck("pairDelim", TypeSig.lit(TypeEnum.STRING), TypeSig.lit(TypeEnum.STRING)),
-          ParamCheck("keyValueDelim", TypeSig.lit(TypeEnum.STRING), TypeSig.lit(TypeEnum.STRING)))),
+        Seq(new ParamCheck("str", TypeSig.STRING, TypeSig.STRING),
+          new ParamCheck(
+            "pairDelim",
+            TypeSig.lit(TypeEnum.STRING),
+            TypeSig.lit(TypeEnum.STRING)),
+          new ParamCheck(
+            "keyValueDelim",
+            TypeSig.lit(TypeEnum.STRING),
+            TypeSig.lit(TypeEnum.STRING)))),
       (in, conf, p, r) => new GpuStringToMapMeta(in, conf, p, r)),
     expr[ArrayMin](
       "Returns the minimum value in the array",
@@ -2830,7 +3002,7 @@ object GpuOverrides extends Logging {
           TypeSig.NULL + TypeSig.STRING + TypeSig.BOOLEAN + TypeSig.DATE + TypeSig.TIMESTAMP +
           TypeSig.ARRAY + TypeSig.STRUCT + TypeSig.BINARY),
         TypeSig.ARRAY.nested(TypeSig.all),
-        repeatingParamCheck = Some(RepeatingParamCheck("arg",
+        repeatingParamCheck = Some(new RepeatingParamCheck("arg",
           TypeSig.gpuNumeric + TypeSig.NULL + TypeSig.STRING +
               TypeSig.BOOLEAN + TypeSig.DATE + TypeSig.TIMESTAMP + TypeSig.STRUCT + TypeSig.BINARY +
               TypeSig.ARRAY.nested(TypeSig.gpuNumeric + TypeSig.NULL + TypeSig.STRING +
@@ -2858,7 +3030,7 @@ object GpuOverrides extends Logging {
         TypeSig.ARRAY.nested(TypeSig.orderable),
         TypeSig.ARRAY.nested(TypeSig.orderable),
         TypeSig.ARRAY.nested(TypeSig.orderable)),
-      GpuArrayDistinctMeta),
+      (expr, conf, p, r) => new GpuArrayDistinctMeta(expr, conf, p, r)),
     expr[Flatten](
       "Creates a single array from an array of arrays",
       ExprChecks.unaryProject(
@@ -2876,11 +3048,11 @@ object GpuOverrides extends Logging {
         (TypeSig.commonCudfTypes + TypeSig.DECIMAL_128 + TypeSig.NULL + TypeSig.BINARY +
             TypeSig.ARRAY + TypeSig.STRUCT + TypeSig.MAP).nested(),
         TypeSig.all,
-        Seq(ParamCheck("function",
+        Seq(new ParamCheck("function",
           (TypeSig.commonCudfTypes + TypeSig.DECIMAL_128 + TypeSig.NULL + TypeSig.BINARY +
               TypeSig.ARRAY + TypeSig.STRUCT + TypeSig.MAP).nested(),
           TypeSig.all)),
-        Some(RepeatingParamCheck("arguments",
+        Some(new RepeatingParamCheck("arguments",
           (TypeSig.commonCudfTypes + TypeSig.DECIMAL_128 + TypeSig.NULL + TypeSig.BINARY +
               TypeSig.ARRAY + TypeSig.STRUCT + TypeSig.MAP).nested(),
           TypeSig.all))),
@@ -2912,11 +3084,11 @@ object GpuOverrides extends Logging {
         TypeSig.MAP),
         TypeSig.ARRAY.nested(TypeSig.all),
         Seq(
-          ParamCheck("argument",
+          new ParamCheck("argument",
             TypeSig.ARRAY.nested(TypeSig.commonCudfTypes + TypeSig.DECIMAL_128 + TypeSig.NULL +
                 TypeSig.BINARY + TypeSig.ARRAY + TypeSig.STRUCT + TypeSig.MAP),
             TypeSig.ARRAY.nested(TypeSig.all)),
-          ParamCheck("function",
+          new ParamCheck("function",
             (TypeSig.commonCudfTypes + TypeSig.DECIMAL_128 + TypeSig.NULL +
                 TypeSig.BINARY + TypeSig.ARRAY + TypeSig.STRUCT + TypeSig.MAP).nested(),
             TypeSig.all))),
@@ -2929,11 +3101,11 @@ object GpuOverrides extends Logging {
       "Return true if any element satisfies the predicate LambdaFunction",
       ExprChecks.projectOnly(TypeSig.BOOLEAN, TypeSig.BOOLEAN,
         Seq(
-          ParamCheck("argument",
+          new ParamCheck("argument",
             TypeSig.ARRAY.nested(TypeSig.commonCudfTypes + TypeSig.DECIMAL_128 + TypeSig.NULL +
                 TypeSig.BINARY + TypeSig.ARRAY + TypeSig.STRUCT + TypeSig.MAP),
             TypeSig.ARRAY.nested(TypeSig.all)),
-          ParamCheck("function", TypeSig.BOOLEAN, TypeSig.BOOLEAN))),
+          new ParamCheck("function", TypeSig.BOOLEAN, TypeSig.BOOLEAN))),
       (in, conf, p, r) => new ExprMeta[ArrayExists](in, conf, p, r) {
         override def convertToGpuImpl(): GpuExpression = {
           GpuArrayExists(
@@ -2950,11 +3122,11 @@ object GpuOverrides extends Logging {
         TypeSig.MAP),
         TypeSig.ARRAY.nested(TypeSig.all),
         Seq(
-          ParamCheck("argument",
+          new ParamCheck("argument",
             TypeSig.ARRAY.nested(TypeSig.commonCudfTypes + TypeSig.DECIMAL_128 + TypeSig.NULL +
               TypeSig.BINARY + TypeSig.ARRAY + TypeSig.STRUCT + TypeSig.MAP),
             TypeSig.ARRAY.nested(TypeSig.all)),
-          ParamCheck("function", TypeSig.BOOLEAN, TypeSig.BOOLEAN))),
+          new ParamCheck("function", TypeSig.BOOLEAN, TypeSig.BOOLEAN))),
       (in, conf, p, r) => new ExprMeta[ArrayFilter](in, conf, p, r) {
         override def convertToGpuImpl(): GpuExpression = {
           GpuArrayFilter(
@@ -2978,17 +3150,17 @@ object GpuOverrides extends Logging {
         TypeSig.commonCudfTypes + TypeSig.DECIMAL_128,
         TypeSig.all,
         Seq(
-          ParamCheck("argument",
+          new ParamCheck("argument",
             TypeSig.ARRAY.nested(TypeSig.commonCudfTypes + TypeSig.DECIMAL_128 + TypeSig.NULL +
                 TypeSig.BINARY + TypeSig.STRUCT),
             TypeSig.ARRAY.nested(TypeSig.all)),
-          ParamCheck("zero",
+          new ParamCheck("zero",
             TypeSig.commonCudfTypes + TypeSig.DECIMAL_128,
             TypeSig.all),
-          ParamCheck("merge",
+          new ParamCheck("merge",
             TypeSig.commonCudfTypes + TypeSig.DECIMAL_128,
             TypeSig.all),
-          ParamCheck("finish",
+          new ParamCheck("finish",
             TypeSig.commonCudfTypes + TypeSig.DECIMAL_128,
             TypeSig.all))),
       (in, conf, p, r) => new GpuArrayAggregateMeta(in, conf, p, r)),
@@ -3000,7 +3172,7 @@ object GpuOverrides extends Logging {
         TypeSig.commonCudfTypes + TypeSig.DECIMAL_128 + TypeSig.NULL + TypeSig.BINARY +
           TypeSig.ARRAY + TypeSig.STRUCT + TypeSig.MAP),
         TypeSig.ARRAY.nested(TypeSig.all),
-        repeatingParamCheck = Some(RepeatingParamCheck("children",
+        repeatingParamCheck = Some(new RepeatingParamCheck("children",
           TypeSig.ARRAY.nested(TypeSig.commonCudfTypes + TypeSig.DECIMAL_128 + TypeSig.NULL +
             TypeSig.BINARY + TypeSig.ARRAY + TypeSig.STRUCT + TypeSig.MAP),
           TypeSig.ARRAY.nested(TypeSig.all)))),
@@ -3131,7 +3303,7 @@ object GpuOverrides extends Logging {
           TypeSig.ARRAY.nested(TypeSig.commonCudfTypes + TypeSig.DECIMAL_128 +
             TypeSig.ARRAY + TypeSig.STRUCT + TypeSig.MAP),
           TypeSig.ARRAY.nested(TypeSig.all))),
-      GpuMapFromArraysMeta
+      (expr, conf, p, r) => new GpuMapFromArraysMeta(expr, conf, p, r)
     ),
     expr[TransformKeys](
       "Transform keys in a map using a transform function",
@@ -3139,18 +3311,18 @@ object GpuOverrides extends Logging {
           TypeSig.NULL + TypeSig.BINARY + TypeSig.ARRAY + TypeSig.STRUCT + TypeSig.MAP),
         TypeSig.MAP.nested(TypeSig.all),
         Seq(
-          ParamCheck("argument",
+          new ParamCheck("argument",
             TypeSig.MAP.nested(TypeSig.commonCudfTypes + TypeSig.DECIMAL_128 + TypeSig.NULL +
                 TypeSig.BINARY + TypeSig.ARRAY + TypeSig.STRUCT + TypeSig.MAP),
             TypeSig.MAP.nested(TypeSig.all)),
-          ParamCheck("function",
+          new ParamCheck("function",
             // We need to be able to check for duplicate keys (equality)
             TypeSig.commonCudfTypes + TypeSig.DECIMAL_128 + TypeSig.NULL,
             TypeSig.all - TypeSig.MAP.nested()))),
       (in, conf, p, r) => new ExprMeta[TransformKeys](in, conf, p, r) {
         override def tagExprForGpu(): Unit = {
-          // Spark 4.1+ returns an enum value instead of String, so use toString first
+          // Spark 4.1+ returns an enum value instead of String, so convert it to a String first
-          SQLConf.get.getConf(SQLConf.MAP_KEY_DEDUP_POLICY).toString.toUpperCase match {
+          confValueToString(SQLConf.get.getConf(SQLConf.MAP_KEY_DEDUP_POLICY)).toUpperCase match {
             case "EXCEPTION"| "LAST_WIN" => // Good we can support this
             case other =>
               willNotWorkOnGpu(s"$other is not supported for config setting" +
@@ -3167,11 +3339,11 @@ object GpuOverrides extends Logging {
           TypeSig.NULL + TypeSig.BINARY + TypeSig.ARRAY + TypeSig.STRUCT + TypeSig.MAP),
         TypeSig.MAP.nested(TypeSig.all),
         Seq(
-          ParamCheck("argument",
+          new ParamCheck("argument",
             TypeSig.MAP.nested(TypeSig.commonCudfTypes + TypeSig.DECIMAL_128 + TypeSig.NULL +
                 TypeSig.BINARY + TypeSig.ARRAY + TypeSig.STRUCT + TypeSig.MAP),
             TypeSig.MAP.nested(TypeSig.all)),
-          ParamCheck("function",
+          new ParamCheck("function",
             (TypeSig.commonCudfTypes + TypeSig.DECIMAL_128 + TypeSig.NULL +
                 TypeSig.BINARY + TypeSig.ARRAY + TypeSig.STRUCT + TypeSig.MAP).nested(),
             TypeSig.all))),
@@ -3186,15 +3358,15 @@ object GpuOverrides extends Logging {
           TypeSig.NULL + TypeSig.BINARY + TypeSig.ARRAY + TypeSig.STRUCT + TypeSig.MAP),
         TypeSig.MAP.nested(TypeSig.all),
         Seq(
-          ParamCheck("argument1",
+          new ParamCheck("argument1",
             TypeSig.MAP.nested(TypeSig.commonCudfTypes + TypeSig.DECIMAL_128 + TypeSig.NULL +
                 TypeSig.BINARY + TypeSig.ARRAY + TypeSig.STRUCT + TypeSig.MAP),
             TypeSig.MAP.nested(TypeSig.all)),
-          ParamCheck("argument2",
+          new ParamCheck("argument2",
             TypeSig.MAP.nested(TypeSig.commonCudfTypes + TypeSig.DECIMAL_128 + TypeSig.NULL +
                 TypeSig.BINARY + TypeSig.ARRAY + TypeSig.STRUCT + TypeSig.MAP),
             TypeSig.MAP.nested(TypeSig.all)),
-          ParamCheck("function",
+          new ParamCheck("function",
             (TypeSig.commonCudfTypes + TypeSig.DECIMAL_128 + TypeSig.NULL +
                 TypeSig.BINARY + TypeSig.ARRAY + TypeSig.STRUCT + TypeSig.MAP).nested(),
             TypeSig.all))),
@@ -3210,11 +3382,11 @@ object GpuOverrides extends Logging {
           TypeSig.NULL + TypeSig.BINARY + TypeSig.ARRAY + TypeSig.STRUCT + TypeSig.MAP),
         TypeSig.MAP.nested(TypeSig.all),
         Seq(
-          ParamCheck("argument",
+          new ParamCheck("argument",
             TypeSig.MAP.nested(TypeSig.commonCudfTypes + TypeSig.DECIMAL_128 + TypeSig.NULL +
                 TypeSig.BINARY + TypeSig.ARRAY + TypeSig.STRUCT + TypeSig.MAP),
             TypeSig.MAP.nested(TypeSig.all)),
-          ParamCheck("function", TypeSig.BOOLEAN, TypeSig.BOOLEAN))),
+          new ParamCheck("function", TypeSig.BOOLEAN, TypeSig.BOOLEAN))),
       (in, conf, p, r) => new ExprMeta[MapFilter](in, conf, p, r) {
         override def convertToGpuImpl(): GpuExpression = {
           GpuMapFilter(childExprs.head.convertToGpu(), childExprs(1).convertToGpu())
@@ -3223,9 +3395,9 @@ object GpuOverrides extends Logging {
     expr[StringLocate](
       "Substring search operator",
       ExprChecks.projectOnly(TypeSig.INT, TypeSig.INT,
-        Seq(ParamCheck("substr", TypeSig.lit(TypeEnum.STRING), TypeSig.STRING),
-          ParamCheck("str", TypeSig.STRING, TypeSig.STRING),
-          ParamCheck("start", TypeSig.lit(TypeEnum.INT), TypeSig.INT))),
+        Seq(new ParamCheck("substr", TypeSig.lit(TypeEnum.STRING), TypeSig.STRING),
+          new ParamCheck("str", TypeSig.STRING, TypeSig.STRING),
+          new ParamCheck("start", TypeSig.lit(TypeEnum.INT), TypeSig.INT))),
       (in, conf, p, r) => new TernaryExprMeta[StringLocate](in, conf, p, r) {
         override def convertToGpu(
             val0: Expression,
@@ -3236,8 +3408,8 @@ object GpuOverrides extends Logging {
     expr[StringInstr](
       "Instr string operator",
       ExprChecks.projectOnly(TypeSig.INT, TypeSig.INT,
-        Seq(ParamCheck("str", TypeSig.STRING, TypeSig.STRING),
-            ParamCheck("substr", TypeSig.lit(TypeEnum.STRING), TypeSig.STRING))),
+        Seq(new ParamCheck("str", TypeSig.STRING, TypeSig.STRING),
+            new ParamCheck("substr", TypeSig.lit(TypeEnum.STRING), TypeSig.STRING))),
       (in, conf, p, r) => new BinaryExprMeta[StringInstr](in, conf, p, r) {
         override def convertToGpu(
             str: Expression,
@@ -3247,9 +3419,9 @@ object GpuOverrides extends Logging {
     expr[Substring](
       "Substring operator",
       ExprChecks.projectOnly(TypeSig.STRING, TypeSig.STRING + TypeSig.BINARY,
-        Seq(ParamCheck("str", TypeSig.STRING, TypeSig.STRING + TypeSig.BINARY),
-          ParamCheck("pos", TypeSig.INT, TypeSig.INT),
-          ParamCheck("len", TypeSig.INT, TypeSig.INT))),
+        Seq(new ParamCheck("str", TypeSig.STRING, TypeSig.STRING + TypeSig.BINARY),
+          new ParamCheck("pos", TypeSig.INT, TypeSig.INT),
+          new ParamCheck("len", TypeSig.INT, TypeSig.INT))),
       (in, conf, p, r) => new TernaryExprMeta[Substring](in, conf, p, r) {
         override def convertToGpu(
             column: Expression,
@@ -3260,16 +3432,16 @@ object GpuOverrides extends Logging {
     expr[SubstringIndex](
       "substring_index operator",
       ExprChecks.projectOnly(TypeSig.STRING, TypeSig.STRING,
-        Seq(ParamCheck("str", TypeSig.STRING, TypeSig.STRING),
-          ParamCheck("delim", TypeSig.lit(TypeEnum.STRING), TypeSig.STRING),
-          ParamCheck("count", TypeSig.lit(TypeEnum.INT), TypeSig.INT))),
+        Seq(new ParamCheck("str", TypeSig.STRING, TypeSig.STRING),
+          new ParamCheck("delim", TypeSig.lit(TypeEnum.STRING), TypeSig.STRING),
+          new ParamCheck("count", TypeSig.lit(TypeEnum.INT), TypeSig.INT))),
       (in, conf, p, r) => new SubstringIndexMeta(in, conf, p, r)),
     expr[StringRepeat](
       "StringRepeat operator that repeats the given strings with numbers of times " +
         "given by repeatTimes",
       ExprChecks.projectOnly(TypeSig.STRING, TypeSig.STRING,
-        Seq(ParamCheck("input", TypeSig.STRING, TypeSig.STRING),
-          ParamCheck("repeatTimes", TypeSig.INT, TypeSig.INT))),
+        Seq(new ParamCheck("input", TypeSig.STRING, TypeSig.STRING),
+          new ParamCheck("repeatTimes", TypeSig.INT, TypeSig.INT))),
       (in, conf, p, r) => new BinaryExprMeta[StringRepeat](in, conf, p, r) {
         override def convertToGpu(
             input: Expression,
@@ -3278,9 +3450,9 @@ object GpuOverrides extends Logging {
     expr[StringReplace](
       "StringReplace operator",
       ExprChecks.projectOnly(TypeSig.STRING, TypeSig.STRING,
-        Seq(ParamCheck("src", TypeSig.STRING, TypeSig.STRING),
-          ParamCheck("search", TypeSig.STRING, TypeSig.STRING),
-          ParamCheck("replace", TypeSig.STRING, TypeSig.STRING))),
+        Seq(new ParamCheck("src", TypeSig.STRING, TypeSig.STRING),
+          new ParamCheck("search", TypeSig.STRING, TypeSig.STRING),
+          new ParamCheck("replace", TypeSig.STRING, TypeSig.STRING))),
       (in, conf, p, r) => new TernaryExprMeta[StringReplace](in, conf, p, r) {
         override def convertToGpu(
             column: Expression,
@@ -3291,9 +3463,9 @@ object GpuOverrides extends Logging {
     expr[StringTrim](
       "StringTrim operator",
       ExprChecks.projectOnly(TypeSig.STRING, TypeSig.STRING,
-        Seq(ParamCheck("src", TypeSig.STRING, TypeSig.STRING)),
+        Seq(new ParamCheck("src", TypeSig.STRING, TypeSig.STRING)),
         // Should really be an OptionalParam
-        Some(RepeatingParamCheck("trimStr", TypeSig.lit(TypeEnum.STRING), TypeSig.STRING))),
+        Some(new RepeatingParamCheck("trimStr", TypeSig.lit(TypeEnum.STRING), TypeSig.STRING))),
       (in, conf, p, r) => new String2TrimExpressionMeta[StringTrim](in, conf, p, r) {
         override def convertToGpu(
             column: Expression,
@@ -3303,9 +3475,9 @@ object GpuOverrides extends Logging {
     expr[StringTrimLeft](
       "StringTrimLeft operator",
       ExprChecks.projectOnly(TypeSig.STRING, TypeSig.STRING,
-        Seq(ParamCheck("src", TypeSig.STRING, TypeSig.STRING)),
+        Seq(new ParamCheck("src", TypeSig.STRING, TypeSig.STRING)),
         // Should really be an OptionalParam
-        Some(RepeatingParamCheck("trimStr", TypeSig.lit(TypeEnum.STRING), TypeSig.STRING))),
+        Some(new RepeatingParamCheck("trimStr", TypeSig.lit(TypeEnum.STRING), TypeSig.STRING))),
       (in, conf, p, r) =>
         new String2TrimExpressionMeta[StringTrimLeft](in, conf, p, r) {
           override def convertToGpu(
@@ -3316,9 +3488,9 @@ object GpuOverrides extends Logging {
     expr[StringTrimRight](
       "StringTrimRight operator",
       ExprChecks.projectOnly(TypeSig.STRING, TypeSig.STRING,
-        Seq(ParamCheck("src", TypeSig.STRING, TypeSig.STRING)),
+        Seq(new ParamCheck("src", TypeSig.STRING, TypeSig.STRING)),
         // Should really be an OptionalParam
-        Some(RepeatingParamCheck("trimStr", TypeSig.lit(TypeEnum.STRING), TypeSig.STRING))),
+        Some(new RepeatingParamCheck("trimStr", TypeSig.lit(TypeEnum.STRING), TypeSig.STRING))),
       (in, conf, p, r) =>
         new String2TrimExpressionMeta[StringTrimRight](in, conf, p, r) {
           override def convertToGpu(
@@ -3329,9 +3501,9 @@ object GpuOverrides extends Logging {
     expr[StringTranslate](
       "StringTranslate operator",
       ExprChecks.projectOnly(TypeSig.STRING, TypeSig.STRING,
-        Seq(ParamCheck("input", TypeSig.STRING, TypeSig.STRING),
-          ParamCheck("from", TypeSig.lit(TypeEnum.STRING), TypeSig.STRING),
-          ParamCheck("to", TypeSig.lit(TypeEnum.STRING), TypeSig.STRING))),
+        Seq(new ParamCheck("input", TypeSig.STRING, TypeSig.STRING),
+          new ParamCheck("from", TypeSig.lit(TypeEnum.STRING), TypeSig.STRING),
+          new ParamCheck("to", TypeSig.lit(TypeEnum.STRING), TypeSig.STRING))),
       (in, conf, p, r) => new TernaryExprMeta[StringTranslate](in, conf, p, r) {
         override def convertToGpu(
             input: Expression,
@@ -3365,7 +3537,7 @@ object GpuOverrides extends Logging {
         TypeSig.commonCudfTypes + TypeSig.NULL + TypeSig.DECIMAL_128 +
             TypeSig.ARRAY + TypeSig.STRUCT + TypeSig.MAP + TypeSig.BINARY),
         (TypeSig.STRING + TypeSig.BINARY + TypeSig.ARRAY).nested(TypeSig.all),
-        repeatingParamCheck = Some(RepeatingParamCheck("input",
+        repeatingParamCheck = Some(new RepeatingParamCheck("input",
           (TypeSig.STRING + TypeSig.ARRAY).nested(
             TypeSig.commonCudfTypes + TypeSig.NULL + TypeSig.DECIMAL_128 +
                 TypeSig.ARRAY + TypeSig.STRUCT + TypeSig.MAP + TypeSig.BINARY),
@@ -3378,15 +3550,15 @@ object GpuOverrides extends Logging {
       pluginChecks = ExprChecks.projectOnly(
         outputCheck = TypeSig.STRING,
         paramCheck = Seq(
-          ParamCheck(
+          new ParamCheck(
             name = "num",
             cudf = TypeSig.STRING,
             spark = TypeSig.STRING),
-          ParamCheck(
+          new ParamCheck(
             name = "from_base",
             cudf = TypeSig.INT,
             spark = TypeSig.INT),
-          ParamCheck(
+          new ParamCheck(
             name = "to_base",
             cudf = TypeSig.INT,
             spark = TypeSig.INT)),
@@ -3419,7 +3591,7 @@ object GpuOverrides extends Logging {
       ExprChecks.projectOnly(TypeSig.MAP.nested(TypeSig.commonCudfTypes + TypeSig.DECIMAL_128 +
           TypeSig.NULL + TypeSig.ARRAY + TypeSig.STRUCT + TypeSig.MAP),
         TypeSig.MAP.nested(TypeSig.all),
-        repeatingParamCheck = Some(RepeatingParamCheck("input",
+        repeatingParamCheck = Some(new RepeatingParamCheck("input",
           TypeSig.MAP.nested(TypeSig.commonCudfTypes + TypeSig.DECIMAL_128 +
           TypeSig.NULL + TypeSig.ARRAY + TypeSig.STRUCT + TypeSig.MAP),
           TypeSig.MAP.nested(TypeSig.all)))),
@@ -3433,12 +3605,12 @@ object GpuOverrides extends Logging {
           TypeSig.NULL + TypeSig.BINARY + TypeSig.ARRAY + TypeSig.STRUCT + TypeSig.MAP),
         TypeSig.ARRAY.nested(TypeSig.all),
         Seq(
-          ParamCheck("x",
+          new ParamCheck("x",
             TypeSig.ARRAY.nested(TypeSig.commonCudfTypes + TypeSig.DECIMAL_128 + TypeSig.NULL +
                 TypeSig.BINARY + TypeSig.ARRAY + TypeSig.STRUCT + TypeSig.MAP),
             TypeSig.ARRAY.nested(TypeSig.all)),
-          ParamCheck("start", TypeSig.INT, TypeSig.INT),
-          ParamCheck("length", TypeSig.INT, TypeSig.INT))),
+          new ParamCheck("start", TypeSig.INT, TypeSig.INT),
+          new ParamCheck("length", TypeSig.INT, TypeSig.INT))),
       (in, conf, p, r) => new TernaryExprMeta[Slice](in, conf, p, r) {
         override def convertToGpu(
             x: Expression,
@@ -3451,13 +3623,13 @@ object GpuOverrides extends Logging {
         "string to replace nulls. If no value is set for nullReplacement, any null value " +
         "is filtered.",
       ExprChecks.projectOnly(TypeSig.STRING, TypeSig.STRING,
-        Seq(ParamCheck("array",
+        Seq(new ParamCheck("array",
           TypeSig.ARRAY.nested(TypeSig.STRING),
           TypeSig.ARRAY.nested(TypeSig.STRING)),
-          ParamCheck("delimiter",
+          new ParamCheck("delimiter",
             TypeSig.STRING,
             TypeSig.STRING)),
-        repeatingParamCheck = Some(RepeatingParamCheck("nullReplacement",
+        repeatingParamCheck = Some(new RepeatingParamCheck("nullReplacement",
           TypeSig.lit(TypeEnum.STRING),
           TypeSig.STRING))),
       (a, conf, p, r) => new ExprMeta[ArrayJoin](a, conf, p, r) {
@@ -3475,7 +3647,7 @@ object GpuOverrides extends Logging {
       "Concatenates multiple input strings or array of strings into a single " +
         "string using a given separator",
       ExprChecks.projectOnly(TypeSig.STRING, TypeSig.STRING,
-        repeatingParamCheck = Some(RepeatingParamCheck("input",
+        repeatingParamCheck = Some(new RepeatingParamCheck("input",
           (TypeSig.STRING + TypeSig.ARRAY).nested(TypeSig.STRING),
           (TypeSig.STRING + TypeSig.ARRAY).nested(TypeSig.STRING)))),
       (a, conf, p, r) => new ExprMeta[ConcatWs](a, conf, p, r) {
@@ -3493,15 +3665,15 @@ object GpuOverrides extends Logging {
     expr[Murmur3Hash](
       "Murmur3 hash operator",
       HashExprChecks.murmur3ProjectChecks,
-      Murmur3HashExprMeta.apply),
+      ((expr, conf, parent, rule) => new Murmur3HashExprMeta(expr, conf, parent, rule))),
     expr[XxHash64](
       "xxhash64 hash operator",
       HashExprChecks.xxhash64ProjectChecks,
-      XxHash64ExprMeta.apply),
+      ((expr, conf, parent, rule) => new XxHash64ExprMeta(expr, conf, parent, rule))),
     expr[HiveHash](
       "hive hash operator",
       ExprChecks.projectOnly(TypeSig.INT, TypeSig.INT,
-        repeatingParamCheck = Some(RepeatingParamCheck("input",
+        repeatingParamCheck = Some(new RepeatingParamCheck("input",
           (TypeSig.commonCudfTypes + TypeSig.NULL + TypeSig.STRUCT + TypeSig.ARRAY).nested() +
               TypeSig.psNote(TypeEnum.ARRAY, "The nesting depth has a certain limit") +
               TypeSig.psNote(TypeEnum.STRUCT, "The nesting depth has a certain limit"),
@@ -3582,38 +3754,38 @@ object GpuOverrides extends Logging {
     expr[RegExpReplace](
       "String replace using a regular expression pattern",
       ExprChecks.projectOnly(TypeSig.STRING, TypeSig.STRING,
-        Seq(ParamCheck("str", TypeSig.STRING, TypeSig.STRING),
-          ParamCheck("regex", TypeSig.lit(TypeEnum.STRING), TypeSig.STRING),
-          ParamCheck("rep", TypeSig.lit(TypeEnum.STRING), TypeSig.STRING),
-          ParamCheck("pos", TypeSig.lit(TypeEnum.INT)
+        Seq(new ParamCheck("str", TypeSig.STRING, TypeSig.STRING),
+          new ParamCheck("regex", TypeSig.lit(TypeEnum.STRING), TypeSig.STRING),
+          new ParamCheck("rep", TypeSig.lit(TypeEnum.STRING), TypeSig.STRING),
+          new ParamCheck("pos", TypeSig.lit(TypeEnum.INT)
               .withPsNote(TypeEnum.INT, "only a value of 1 is supported"),
             TypeSig.lit(TypeEnum.INT)))),
       (a, conf, p, r) => new GpuRegExpReplaceMeta(a, conf, p, r)),
     expr[RegExpExtract](
       "Extract a specific group identified by a regular expression",
       ExprChecks.projectOnly(TypeSig.STRING, TypeSig.STRING,
-        Seq(ParamCheck("str", TypeSig.STRING, TypeSig.STRING),
-          ParamCheck("regexp", TypeSig.lit(TypeEnum.STRING), TypeSig.STRING),
-          ParamCheck("idx", TypeSig.lit(TypeEnum.INT),
+        Seq(new ParamCheck("str", TypeSig.STRING, TypeSig.STRING),
+          new ParamCheck("regexp", TypeSig.lit(TypeEnum.STRING), TypeSig.STRING),
+          new ParamCheck("idx", TypeSig.lit(TypeEnum.INT),
             TypeSig.lit(TypeEnum.INT)))),
       (a, conf, p, r) => new GpuRegExpExtractMeta(a, conf, p, r)),
     expr[RegExpExtractAll](
       "Extract all strings matching a regular expression corresponding to the regex group index",
       ExprChecks.projectOnly(TypeSig.ARRAY.nested(TypeSig.STRING),
         TypeSig.ARRAY.nested(TypeSig.STRING),
-        Seq(ParamCheck("str", TypeSig.STRING, TypeSig.STRING),
-          ParamCheck("regexp", TypeSig.lit(TypeEnum.STRING), TypeSig.STRING),
-          ParamCheck("idx", TypeSig.lit(TypeEnum.INT), TypeSig.INT))),
+        Seq(new ParamCheck("str", TypeSig.STRING, TypeSig.STRING),
+          new ParamCheck("regexp", TypeSig.lit(TypeEnum.STRING), TypeSig.STRING),
+          new ParamCheck("idx", TypeSig.lit(TypeEnum.INT), TypeSig.INT))),
       (a, conf, p, r) => new GpuRegExpExtractAllMeta(a, conf, p, r)),
     expr[ParseUrl](
       "Extracts a part from a URL",
       ExprChecks.projectOnly(TypeSig.STRING, TypeSig.STRING,
-        Seq(ParamCheck("url", TypeSig.STRING, TypeSig.STRING),
-          ParamCheck("partToExtract", TypeSig.lit(TypeEnum.STRING).withPsNote(
+        Seq(new ParamCheck("url", TypeSig.STRING, TypeSig.STRING),
+          new ParamCheck("partToExtract", TypeSig.lit(TypeEnum.STRING).withPsNote(
             TypeEnum.STRING, "only support partToExtract = PROTOCOL | HOST | QUERY | PATH"),
             TypeSig.STRING)),
           // Should really be an OptionalParam
-          Some(RepeatingParamCheck("key", TypeSig.STRING, TypeSig.STRING))),
+          Some(new RepeatingParamCheck("key", TypeSig.STRING, TypeSig.STRING))),
       (a, conf, p, r) => new ExprMeta[ParseUrl](a, conf, p, r) {
         override def tagExprForGpu(): Unit = {
 
@@ -3726,8 +3898,8 @@ object GpuOverrides extends Logging {
         TypeSig.ARRAY.nested(TypeSig.commonCudfTypes + TypeSig.NULL + TypeSig.DECIMAL_128 +
             TypeSig.ARRAY + TypeSig.STRUCT + TypeSig.MAP),
         TypeSig.ARRAY.nested(TypeSig.all),
-        Seq(ParamCheck("n", TypeSig.lit(TypeEnum.INT), TypeSig.INT)),
-        Some(RepeatingParamCheck("expr",
+        Seq(new ParamCheck("n", TypeSig.lit(TypeEnum.INT), TypeSig.INT)),
+        Some(new RepeatingParamCheck("expr",
           (TypeSig.commonCudfTypes + TypeSig.NULL + TypeSig.DECIMAL_128 +
               TypeSig.ARRAY + TypeSig.STRUCT + TypeSig.MAP).nested(),
           TypeSig.all))),
@@ -3739,7 +3911,7 @@ object GpuOverrides extends Logging {
         TypeSig.ARRAY.nested(TypeSig.commonCudfTypes + TypeSig.NULL + TypeSig.DECIMAL_128 +
             TypeSig.ARRAY + TypeSig.STRUCT),
         TypeSig.ARRAY.nested(TypeSig.all),
-        repeatingParamCheck = Some(RepeatingParamCheck("input",
+        repeatingParamCheck = Some(new RepeatingParamCheck("input",
           (TypeSig.commonCudfTypes + TypeSig.NULL + TypeSig.DECIMAL_128 +
               TypeSig.ARRAY + TypeSig.STRUCT).nested(),
           TypeSig.all))),
@@ -3755,7 +3927,7 @@ object GpuOverrides extends Logging {
             .withPsNote(TypeEnum.ARRAY, "window operations are disabled by default due " +
                 "to extreme memory usage"),
         TypeSig.ARRAY.nested(TypeSig.all),
-        Seq(ParamCheck("input",
+        Seq(new ParamCheck("input",
           (TypeSig.commonCudfTypes + TypeSig.DECIMAL_128 + TypeSig.BINARY +
               TypeSig.NULL + TypeSig.STRUCT + TypeSig.ARRAY + TypeSig.MAP).nested(),
           TypeSig.all))),
@@ -3796,7 +3968,7 @@ object GpuOverrides extends Logging {
             .withPsNote(TypeEnum.ARRAY, "window operations are disabled by default due " +
                 "to extreme memory usage"),
         TypeSig.ARRAY.nested(TypeSig.all),
-        Seq(ParamCheck("input",
+        Seq(new ParamCheck("input",
           (TypeSig.commonCudfTypes + TypeSig.DECIMAL_128 +
             TypeSig.NULL +
             TypeSig.STRUCT +
@@ -3835,7 +4007,7 @@ object GpuOverrides extends Logging {
       "Aggregation computing population standard deviation",
       ExprChecks.groupByOnly(
         TypeSig.DOUBLE, TypeSig.DOUBLE,
-        Seq(ParamCheck("input", TypeSig.DOUBLE, TypeSig.DOUBLE))),
+        Seq(new ParamCheck("input", TypeSig.DOUBLE, TypeSig.DOUBLE))),
       (a, conf, p, r) => new AggExprMeta[StddevPop](a, conf, p, r) {
         override def convertToGpu(childExprs: Seq[Expression]): GpuExpression = {
           val legacyStatisticalAggregate = SQLConf.get.legacyStatisticalAggregate
@@ -3846,7 +4018,7 @@ object GpuOverrides extends Logging {
       "Aggregation computing sample standard deviation",
       ExprChecks.fullAgg(
           TypeSig.DOUBLE, TypeSig.DOUBLE,
-          Seq(ParamCheck("input", TypeSig.DOUBLE,
+          Seq(new ParamCheck("input", TypeSig.DOUBLE,
             TypeSig.DOUBLE))),
         (a, conf, p, r) => new AggExprMeta[StddevSamp](a, conf, p, r) {
           override def convertToGpu(childExprs: Seq[Expression]): GpuExpression = {
@@ -3858,7 +4030,7 @@ object GpuOverrides extends Logging {
       "Aggregation computing population variance",
       ExprChecks.groupByOnly(
         TypeSig.DOUBLE, TypeSig.DOUBLE,
-        Seq(ParamCheck("input", TypeSig.DOUBLE, TypeSig.DOUBLE))),
+        Seq(new ParamCheck("input", TypeSig.DOUBLE, TypeSig.DOUBLE))),
       (a, conf, p, r) => new AggExprMeta[VariancePop](a, conf, p, r) {
         override def convertToGpu(childExprs: Seq[Expression]): GpuExpression = {
           val legacyStatisticalAggregate = SQLConf.get.legacyStatisticalAggregate
@@ -3869,7 +4041,7 @@ object GpuOverrides extends Logging {
       "Aggregation computing sample variance",
       ExprChecks.groupByOnly(
         TypeSig.DOUBLE, TypeSig.DOUBLE,
-        Seq(ParamCheck("input", TypeSig.DOUBLE, TypeSig.DOUBLE))),
+        Seq(new ParamCheck("input", TypeSig.DOUBLE, TypeSig.DOUBLE))),
       (a, conf, p, r) => new AggExprMeta[VarianceSamp](a, conf, p, r) {
         override def convertToGpu(childExprs: Seq[Expression]): GpuExpression = {
           val legacyStatisticalAggregate = SQLConf.get.legacyStatisticalAggregate
@@ -3886,11 +4058,11 @@ object GpuOverrides extends Logging {
         Seq(
           // ANSI interval types are new in Spark 3.2.0 and are not yet supported by the
           // current GPU implementation.
-          ParamCheck("input", TypeSig.integral + TypeSig.fp, TypeSig.integral + TypeSig.fp),
-          ParamCheck("percentage",
+          new ParamCheck("input", TypeSig.integral + TypeSig.fp, TypeSig.integral + TypeSig.fp),
+          new ParamCheck("percentage",
             TypeSig.lit(TypeEnum.DOUBLE) + TypeSig.ARRAY.nested(TypeSig.lit(TypeEnum.DOUBLE)),
             TypeSig.DOUBLE + TypeSig.ARRAY.nested(TypeSig.DOUBLE)),
-          ParamCheck("frequency",
+          new ParamCheck("frequency",
             TypeSig.LONG + TypeSig.ARRAY.nested(TypeSig.LONG),
             TypeSig.LONG + TypeSig.ARRAY.nested(TypeSig.LONG)))),
       (c, conf, p, r) => new TypedImperativeAggExprMeta[Percentile](c, conf, p, r) {
@@ -3953,13 +4125,13 @@ object GpuOverrides extends Logging {
         TypeSig.cpuNumeric + TypeSig.DATE + TypeSig.TIMESTAMP + TypeSig.ARRAY.nested(
           TypeSig.cpuNumeric + TypeSig.DATE + TypeSig.TIMESTAMP),
         Seq(
-          ParamCheck("input",
+          new ParamCheck("input",
             TypeSig.gpuNumeric,
             TypeSig.cpuNumeric + TypeSig.DATE + TypeSig.TIMESTAMP),
-          ParamCheck("percentage",
+          new ParamCheck("percentage",
             TypeSig.DOUBLE + TypeSig.ARRAY.nested(TypeSig.DOUBLE),
             TypeSig.DOUBLE + TypeSig.ARRAY.nested(TypeSig.DOUBLE)),
-          ParamCheck("accuracy", TypeSig.INT, TypeSig.INT))),
+          new ParamCheck("accuracy", TypeSig.INT, TypeSig.INT))),
       (c, conf, p, r) => new TypedImperativeAggExprMeta[ApproximatePercentile](c, conf, p, r) {
 
         override def tagAggForGpu(): Unit = {
@@ -4000,8 +4172,8 @@ object GpuOverrides extends Logging {
     expr[GetJsonObject](
       "Extracts a json object from path",
       ExprChecks.projectOnly(
-        TypeSig.STRING, TypeSig.STRING, Seq(ParamCheck("json", TypeSig.STRING, TypeSig.STRING),
-          ParamCheck("path", TypeSig.lit(TypeEnum.STRING), TypeSig.STRING))),
+        TypeSig.STRING, TypeSig.STRING, Seq(new ParamCheck("json", TypeSig.STRING, TypeSig.STRING),
+          new ParamCheck("path", TypeSig.lit(TypeEnum.STRING), TypeSig.STRING))),
       (a, conf, p, r) => new GpuGetJsonObjectMeta(a, conf, p, r)),
     expr[JsonToStructs](
       "Returns a struct value with the given `jsonStr` and `schema`",
@@ -4011,10 +4183,10 @@ object GpuOverrides extends Logging {
           "MAP only supports keys and values that are of STRING type " +
             "and is only supported at the top level"),
         (TypeSig.STRUCT + TypeSig.MAP + TypeSig.ARRAY).nested(TypeSig.all),
-        Seq(ParamCheck("jsonStr", TypeSig.STRING, TypeSig.STRING))),
+        Seq(new ParamCheck("jsonStr", TypeSig.STRING, TypeSig.STRING))),
       (a, conf, p, r) => new UnaryExprMeta[JsonToStructs](a, conf, p, r) {
         def hasDuplicateFieldNames(dt: DataType): Boolean =
-          TrampolineUtil.dataTypeExistsRecursively(dt, {
+          dataTypeExistsRecursively(dt, {
             case st: StructType =>
               val fn = st.fieldNames
               fn.length != fn.distinct.length
@@ -4022,7 +4194,7 @@ object GpuOverrides extends Logging {
           })
 
         def hasDateTimeType(dt: DataType): Boolean =
-          TrampolineUtil.dataTypeExistsRecursively(dt, t =>
+          dataTypeExistsRecursively(dt, t =>
             t.isInstanceOf[DateType] || t.isInstanceOf[TimestampType]
           )
 
@@ -4056,7 +4228,7 @@ object GpuOverrides extends Logging {
       ExprChecks.projectOnly(
         TypeSig.STRING,
         TypeSig.STRING,
-        Seq(ParamCheck("struct",
+        Seq(new ParamCheck("struct",
           (TypeSig.BOOLEAN + TypeSig.STRING + TypeSig.integral + TypeSig.FLOAT +
             TypeSig.DOUBLE + TypeSig.DATE + TypeSig.TIMESTAMP +
             TypeSig.DECIMAL_128 +
@@ -4077,8 +4249,8 @@ object GpuOverrides extends Logging {
       ExprChecks.projectOnly(
         TypeSig.ARRAY.nested(TypeSig.STRUCT + TypeSig.STRING),
         TypeSig.ARRAY.nested(TypeSig.STRUCT + TypeSig.STRING),
-        Seq(ParamCheck("json", TypeSig.STRING, TypeSig.STRING)),
-        Some(RepeatingParamCheck("field", TypeSig.lit(TypeEnum.STRING), TypeSig.STRING))),
+        Seq(new ParamCheck("json", TypeSig.STRING, TypeSig.STRING)),
+        Some(new RepeatingParamCheck("field", TypeSig.lit(TypeEnum.STRING), TypeSig.STRING))),
       (a, conf, p, r) => new GeneratorExprMeta[JsonTuple](a, conf, p, r) {
         override def tagExprForGpu(): Unit = {
           if (childExprs.length >= 50) {
@@ -4116,11 +4288,14 @@ object GpuOverrides extends Logging {
       ExprChecks.projectOnly(
         TypeSig.ARRAY.nested(TypeSig.integral), TypeSig.ARRAY.nested(TypeSig.integral +
           TypeSig.TIMESTAMP + TypeSig.DATE),
-        Seq(ParamCheck("start", TypeSig.integral, TypeSig.integral + TypeSig.TIMESTAMP +
+        Seq(new ParamCheck("start", TypeSig.integral, TypeSig.integral + TypeSig.TIMESTAMP +
           TypeSig.DATE),
-          ParamCheck("stop", TypeSig.integral, TypeSig.integral + TypeSig.TIMESTAMP +
+          new ParamCheck("stop", TypeSig.integral, TypeSig.integral + TypeSig.TIMESTAMP +
             TypeSig.DATE)),
-        Some(RepeatingParamCheck("step", TypeSig.integral, TypeSig.integral + TypeSig.CALENDAR))),
+        Some(new RepeatingParamCheck(
+          "step",
+          TypeSig.integral,
+          TypeSig.integral + TypeSig.CALENDAR))),
       (a, conf, p, r) => new GpuSequenceMeta(a, conf, p, r)
     ),
     expr[BitLength](
@@ -4174,7 +4349,7 @@ object GpuOverrides extends Logging {
       ExprChecks.reductionAndGroupByAgg(TypeSig.LONG, TypeSig.LONG,
         // HyperLogLogPlusPlus depends on Xxhash64
         // HyperLogLogPlusPlus supports all the types that Xxhash 64 supports
-        Seq(ParamCheck("input",XxHash64Shims.supportedTypes, TypeSig.all))),
+        Seq(new ParamCheck("input",XxHash64Shims.supportedTypes, TypeSig.all))),
       (a, conf, p, r) => new UnaryExprMeta[HyperLogLogPlusPlus](a, conf, p, r) {
 
         // It's the same as Xxhash64
@@ -4218,16 +4393,16 @@ object GpuOverrides extends Logging {
       StaticInvokeCheck,
       (a, conf, p, r) => new StaticInvokeMeta(a, conf, p, r)
     ).note("The supported types are not deterministic since it's a dynamic expression"),
-    SparkShimImpl.ansiCastRule
+    shimExprRule("SparkShimImpl", "ansiCastRule")
   ).collect { case r if r != null => (r.getClassFor.asSubclass(classOf[Expression]), r)}.toMap
 
   // Shim expressions should be last to allow overrides with shim-specific versions
   val expressions: Map[Class[_ <: Expression], ExprRule[_ <: Expression]] =
     commonExpressions ++ TimeStamp.getExprs ++ GpuHiveOverrides.exprs ++
         ZOrderRules.exprs ++ DecimalArithmeticOverrides.exprs ++
-        BloomFilterShims.exprs ++ StringDecodeShims.exprs ++
-        InSubqueryShims.exprs ++ RaiseErrorShim.exprs ++
-        ExternalSource.exprRules ++ SparkShimImpl.getExprs
+        BloomFilterShims.exprs ++ shimExprs("StringDecodeShims") ++
+        shimExprs("InSubqueryShims") ++ shimExprs("RaiseErrorShim") ++
+        ExternalSource.exprRules ++ shimExprRules("SparkShimImpl", "getExprs")
 
   def wrapScan[INPUT <: Scan](
       scan: INPUT,
@@ -4276,7 +4451,7 @@ object GpuOverrides extends Logging {
       })).map(r => (r.getClassFor.asSubclass(classOf[Scan]), r)).toMap
 
   val scans: Map[Class[_ <: Scan], ScanRule[_ <: Scan]] =
-    commonScans ++ SparkShimImpl.getScans ++ ExternalSource.getScans
+    commonScans ++ shimScanRules("SparkShimImpl", "getScans") ++ ExternalSource.getScans
 
   def wrapPart[INPUT <: Partitioning](
       part: INPUT,
@@ -4290,7 +4465,7 @@ object GpuOverrides extends Logging {
     part[HashPartitioning](
       "Hash based partitioning",
       // This needs to match what murmur3 supports.
-      PartChecks(RepeatingParamCheck("hash_key",
+      PartChecks(new RepeatingParamCheck("hash_key",
         (TypeSig.commonCudfTypes + TypeSig.NULL + TypeSig.DECIMAL_128 +
             TypeSig.STRUCT + TypeSig.ARRAY).nested() +
             TypeSig.psNote(TypeEnum.ARRAY, "Arrays of structs are not supported"),
@@ -4314,7 +4489,7 @@ object GpuOverrides extends Logging {
               }
             case Murmur3Mode =>
               val arrayWithStructsHashing = hp.expressions.exists(e =>
-                TrampolineUtil.dataTypeExistsRecursively(e.dataType,
+                dataTypeExistsRecursively(e.dataType,
                   {
                     case ArrayType(_: StructType, _) => true
                     case _ => false
@@ -4334,7 +4509,7 @@ object GpuOverrides extends Logging {
       }),
     part[RangePartitioning](
       "Range partitioning",
-      PartChecks(RepeatingParamCheck("order_key",
+      PartChecks(new RepeatingParamCheck("order_key",
         pluginSupportedOrderableSig + TypeSig.ARRAY.nested(gpuCommonTypes)
            .withPsNote(TypeEnum.ARRAY, "STRUCT is not supported as a child type for ARRAY"),
         TypeSig.orderable)),
@@ -4368,7 +4543,7 @@ object GpuOverrides extends Logging {
   ).map(r => (r.getClassFor.asSubclass(classOf[Partitioning]), r)).toMap
 
   val parts : Map[Class[_ <: Partitioning], PartRule[_ <: Partitioning]] =
-    commonParts ++ SparkShimImpl.getPartitionings
+    commonParts ++ shimPartRules("SparkShimImpl", "getPartitionings")
 
   def wrapDataWriteCmds[INPUT <: DataWritingCommand](
       writeCmd: INPUT,
@@ -4387,7 +4562,8 @@ object GpuOverrides extends Logging {
 
   val dataWriteCmds: Map[Class[_ <: DataWritingCommand],
       DataWritingCommandRule[_ <: DataWritingCommand]] =
-    commonDataWriteCmds ++ GpuHiveOverrides.dataWriteCmds ++ SparkShimImpl.getDataWriteCmds
+    commonDataWriteCmds ++ GpuHiveOverrides.dataWriteCmds ++
+      shimDataWriteCmdRules("SparkShimImpl", "getDataWriteCmds")
 
   def runnableCmd[INPUT <: RunnableCommand](
       desc: String,
@@ -4399,6 +4575,14 @@ object GpuOverrides extends Logging {
     new RunnableCommandRule[INPUT](doWrap, desc, tag)
   }
 
+  def runnableCmdFromShim[INPUT <: RunnableCommand](
+      rule: ShimRunnableCommandRule[INPUT],
+      doWrap: (INPUT, RapidsConf, Option[RapidsMeta[_, _, _]], DataFromReplacementRule)
+          => RunnableCommandMeta[INPUT]): RunnableCommandRule[INPUT] = {
+    require(rule != null, "runnableCmdFromShim requires a non-null shim rule")
+    runnableCmd(rule.desc, doWrap)(rule.tag)
+  }
+
   def wrapRunnableCmd[INPUT <: RunnableCommand](
       cmd: INPUT,
       conf: RapidsConf,
@@ -4418,7 +4602,7 @@ object GpuOverrides extends Logging {
   val runnableCmds = commonRunnableCmds ++
     GpuHiveOverrides.runnableCmds ++
       ExternalSource.runnableCmds ++
-      SparkShimImpl.getRunnableCmds
+      shimRunnableCmdRules("SparkShimImpl", "getRunnableCmds")
 
   def wrapPlan[INPUT <: SparkPlan](
       plan: INPUT,
@@ -4460,7 +4644,7 @@ object GpuOverrides extends Logging {
         (TypeSig.commonCudfTypes + TypeSig.STRUCT + TypeSig.MAP + TypeSig.ARRAY +
           TypeSig.DECIMAL_128 + TypeSig.BINARY).nested(),
         TypeSig.all),
-      (p, conf, parent, r) => new BatchScanExecMeta(p, conf, parent, r)),
+      (p, conf, parent, r) => newBatchScanExecMeta(p, conf, parent, r)),
     exec[CoalesceExec](
       "The backend for the dataframe coalesce method",
       ExecChecks((gpuCommonTypes + TypeSig.STRUCT + TypeSig.ARRAY +
@@ -4495,7 +4679,7 @@ object GpuOverrides extends Logging {
       // The types below are allowed as inputs and outputs.
       ExecChecks((pluginSupportedOrderableSig +
           TypeSig.ARRAY + TypeSig.STRUCT + TypeSig.MAP).nested(), TypeSig.all),
-      GpuTakeOrderedAndProjectExecMeta),
+      (exec, conf, p, r) => new GpuTakeOrderedAndProjectExecMeta(exec, conf, p, r)),
     exec[LocalLimitExec](
       "Per-partition limiting of results",
       ExecChecks((TypeSig.commonCudfTypes + TypeSig.DECIMAL_128 + TypeSig.NULL +
@@ -4530,7 +4714,7 @@ object GpuOverrides extends Logging {
       ExecChecks((TypeSig.commonCudfTypes + TypeSig.NULL + TypeSig.STRUCT + TypeSig.MAP +
           TypeSig.ARRAY + TypeSig.DECIMAL_128 + TypeSig.BINARY +
           GpuTypeShims.additionalCommonOperatorSupportedTypes).nested(), TypeSig.all),
-      GpuFilterExecMeta),
+      (exec, conf, p, r) => new GpuFilterExecMeta(exec, conf, p, r)),
     exec[ShuffleExchangeExec](
       "The backend for most data being exchanged between processes",
       ExecChecks((TypeSig.commonCudfTypes + TypeSig.NULL + TypeSig.DECIMAL_128 + TypeSig.BINARY +
@@ -4668,10 +4852,10 @@ object GpuOverrides extends Logging {
           TypeSig.STRUCT + TypeSig.ARRAY + TypeSig.MAP + TypeSig.BINARY).nested(),
         TypeSig.all,
         Map("partitionSpec" ->
-            InputCheck(
+            new InputCheck(
                 TypeSig.commonCudfTypes + TypeSig.NULL + TypeSig.DECIMAL_128 +
                 TypeSig.STRUCT.nested(TypeSig.commonCudfTypes + TypeSig.NULL + TypeSig.DECIMAL_128),
-            TypeSig.all))),
+            TypeSig.all, List.empty))),
       (windowOp, conf, p, r) =>
         new GpuWindowExecMeta(windowOp, conf, p, r)
     ),
@@ -4685,11 +4869,11 @@ object GpuOverrides extends Logging {
     exec[SubqueryBroadcastExec](
       "Plan to collect and transform the broadcast key values",
       ExecChecks(TypeSig.all, TypeSig.all),
-      (s, conf, p, r) => new GpuSubqueryBroadcastMeta(s, conf, p, r)
+      (s, conf, p, r) => newGpuSubqueryBroadcastMeta(s, conf, p, r)
     ),
-    SparkShimImpl.aqeShuffleReaderExec,
+    shimExecRule("SparkShimImpl", "aqeShuffleReaderExec"),
     // AggregateInPandasExec renamed to ArrowAggregatePythonExec in Spark 4.1.0
-    AggregateInPandasExecShims.execRule.orNull,
+    aggregateInPandasExecRule,
     exec[ArrowEvalPythonExec](
       "The backend of the Scalar Pandas UDFs. Accelerates the data transfer between the" +
         " Java process and the Python process. It also supports scheduling GPU resources" +
@@ -4745,8 +4929,8 @@ object GpuOverrides extends Logging {
     neverReplaceExec[DescribeNamespaceExec]("Namespace metadata operation"),
     neverReplaceExec[DropNamespaceExec]("Namespace metadata operation"),
     neverReplaceExec[SetCatalogAndNamespaceExec]("Namespace metadata operation"),
-    SparkShimImpl.neverReplaceShowCurrentNamespaceCommand,
-    ShowNamespacesExecShims.neverReplaceExec.orNull,
+    shimExecRule("SparkShimImpl", "neverReplaceShowCurrentNamespaceCommand"),
+    optionalShimExecRule("ShowNamespacesExecShims", "neverReplaceExec"),
     neverReplaceExec[AlterTableExec]("Table metadata operation"),
     neverReplaceExec[CreateTableExec]("Table metadata operation"),
     neverReplaceExec[DeleteFromTableExec]("Table metadata operation"),
@@ -4763,9 +4947,10 @@ object GpuOverrides extends Logging {
     neverReplaceExec[ShuffleQueryStageExec]("Shuffle query stage")
   ).collect { case r if r != null => (r.getClassFor.asSubclass(classOf[SparkPlan]), r) }.toMap
 
+  // Shim execs at the end; shims get the last word in substitutions.
   lazy val execs: Map[Class[_ <: SparkPlan], ExecRule[_ <: SparkPlan]] =
     commonExecs ++ GpuHiveOverrides.execs ++ ExternalSource.execRules ++
-      SparkShimImpl.getExecs // Shim execs at the end; shims get the last word in substitutions.
+      shimExecRules("SparkShimImpl", "getExecs")
 
   def getTimeParserPolicy: TimeParserPolicy = {
     val policy = SQLConf.get.getConfString(SQLConf.LEGACY_TIME_PARSER_POLICY.key, "EXCEPTION")
@@ -4947,7 +5132,17 @@ protected class ExplainPlanImpl extends ExplainPlanBase {
 }
 
 // work around any GpuOverride failures
-object GpuOverrideUtil extends Logging {
+object GpuOverrideUtil {
+  // Logger named after this object, without the trailing "$" of the Scala object class.
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+
+  // `msg` is by-name: check the level first so it is only built when it will be logged.
+  private def logWarning(msg: => String, throwable: Throwable): Unit =
+    if (log.isWarnEnabled) log.warn(msg, throwable)
+
+  private def logError(msg: => String, throwable: Throwable): Unit =
+    if (log.isErrorEnabled) log.error(msg, throwable)
+
   def tryOverride(fn: SparkPlan => SparkPlan): SparkPlan => SparkPlan = { plan =>
     val planOriginal = plan.clone()
     val failOnError = TEST_CONF.get(plan.conf) || !SUPPRESS_PLANNING_FAILURE.get(plan.conf)
@@ -4965,7 +5160,7 @@ object GpuOverrideUtil extends Logging {
 }
 
 /** Tag the initial plan when AQE is enabled */
-case class GpuQueryStagePrepOverrides() extends Rule[SparkPlan] with Logging {
+class GpuQueryStagePrepOverrides extends Rule[SparkPlan] with Serializable {
   override def apply(sparkPlan: SparkPlan): SparkPlan = GpuOverrideUtil.tryOverride { plan =>
     // Exposing a bare exchange at the root is only valid while AQE is preparing a
     // query stage. Tag the exchanges seen in this rule so transition cleanup can
@@ -4979,7 +5174,7 @@ case class GpuQueryStagePrepOverrides() extends Rule[SparkPlan] with Logging {
   }(sparkPlan)
 }
 
-case class GpuOverrides() extends Rule[SparkPlan] with Logging {
+case class GpuOverrides() extends Rule[SparkPlan] {
 
   // Spark calls this method once for the whole plan when AQE is off. When AQE is on, it
   // gets called once for each query stage (where a query stage is an `Exchange`).
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuParquetFileFormat.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuParquetFileFormat.scala
index 19f8709d497..0dcf69ba7a2 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuParquetFileFormat.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuParquetFileFormat.scala
@@ -34,7 +34,6 @@ import org.apache.parquet.hadoop.ParquetOutputFormat.JobSummaryLevel
 import org.apache.parquet.hadoop.codec.CodecConfig
 import org.apache.parquet.hadoop.util.ContextUtil
 
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.{Row, SparkSession}
 import org.apache.spark.sql.execution.datasources.DataSourceUtils
 import org.apache.spark.sql.execution.datasources.parquet.{ParquetOptions, ParquetWriteSupport}
@@ -192,7 +191,21 @@ object GpuParquetFileFormat {
   }
 }
 
-class GpuParquetFileFormat extends ColumnarFileFormat with Logging {
+class GpuParquetFileFormat extends ColumnarFileFormat {
+  // Logger named after the runtime class, with any trailing "$" removed.
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+
+  /** Logs `msg` at INFO; the by-name message is only built when INFO is enabled. */
+  private def logInfo(msg: => String): Unit = {
+    if (log.isInfoEnabled) log.info(msg)
+  }
+
+  /** Logs `msg` at WARN; the by-name message is only built when WARN is enabled. */
+  private def logWarning(msg: => String): Unit = {
+    if (log.isWarnEnabled) log.warn(msg)
+  }
+
   /**
    * Prepares a write job and returns an [[ColumnarOutputWriterFactory]].  Client side job
    * preparation can be put here.  For example, user defined output committer can be configured
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuPartitioning.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuPartitioning.scala
index 809f0587b11..75684a89e2f 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuPartitioning.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuPartitioning.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2020-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2020-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -316,7 +316,8 @@ trait GpuPartitioning extends Partitioning {
           val numCompressedToAdd = emptyOutputIndex - outputIndex
           (0 until numCompressedToAdd).foreach { _ =>
             val compressedTable = compressedTables(compressedTableIndex)
-            outputBatches.append(GpuCompressedColumnVector.from(compressedTable))
+            outputBatches.append(
+              GpuCompressedColumnVector.from(compressedTable.buffer, compressedTable.meta))
             compressedTableIndex += 1
           }
           outputBatches.append(emptyBatch)
@@ -326,7 +327,7 @@ trait GpuPartitioning extends Partitioning {
         // add any compressed batches that remain after the last empty batch
         (compressedTableIndex until compressedTables.length).foreach { i =>
           val ct = compressedTables(i)
-          outputBatches.append(GpuCompressedColumnVector.from(ct))
+          outputBatches.append(GpuCompressedColumnVector.from(ct.buffer, ct.meta))
         }
       }
     }
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuPostHocResolutionOverrides.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuPostHocResolutionOverrides.scala
index eda79ca3e96..458dfa2acf1 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuPostHocResolutionOverrides.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuPostHocResolutionOverrides.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2025, NVIDIA CORPORATION.
+ * Copyright (c) 2025-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -26,7 +26,8 @@ import org.apache.spark.sql.catalyst.rules.Rule
  * phase by `SparkSessionExtensions.injectPostHocResolutionRule`. As its name suggests, it will
  * be applied after the logical plan has been resolved.
  */
-case class GpuPostHocResolutionOverrides(spark: SparkSession) extends Rule[LogicalPlan] {
+class GpuPostHocResolutionOverrides(val spark: SparkSession)
+    extends Rule[LogicalPlan] with Serializable {
 
   @transient private val rapidsConf = new RapidsConf(spark.sessionState.conf)
 
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuRangePartitioner.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuRangePartitioner.scala
index c7406227f79..5da50517dea 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuRangePartitioner.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuRangePartitioner.scala
@@ -27,7 +27,7 @@ import org.apache.spark.rdd.{PartitionPruningRDD, RDD}
 import org.apache.spark.sql.catalyst.InternalRow
 import org.apache.spark.sql.catalyst.expressions.Expression
 import org.apache.spark.sql.catalyst.expressions.codegen.LazilyGeneratedOrdering
-import org.apache.spark.sql.rapids.execution.TrampolineUtil
+import org.apache.spark.sql.rapids.shims.DataTypeUtilsShim
 import org.apache.spark.sql.types.{DataType, IntegerType}
 import org.apache.spark.sql.vectorized.ColumnarBatch
 
@@ -173,7 +173,7 @@ case class GpuRangePartitioner(
     sorter: GpuSorter) extends GpuExpression with ShimExpression with GpuPartitioning {
 
   private lazy val converters = new GpuRowToColumnConverter(
-    TrampolineUtil.fromAttributes(sorter.projectedBatchSchema))
+    DataTypeUtilsShim.fromAttributes(sorter.projectedBatchSchema))
 
   override def nullable: Boolean = false
   override def dataType: DataType = IntegerType
@@ -189,7 +189,7 @@ case class GpuRangePartitioner(
     // Don't make this retry-block avoiding nested try-blocks
     // from computeBoundsAndCloseWithRetry
     withResource(converters.convertBatch(rangeBounds,
-      TrampolineUtil.fromAttributes(sorter.projectedBatchSchema))) { ranges =>
+      DataTypeUtilsShim.fromAttributes(sorter.projectedBatchSchema))) { ranges =>
       withResource(sorter.appendProjectedColumns(cb)) { withExtraColumns =>
         sorter.lowerBound(ranges, withExtraColumns)
       }
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuReadCSVFileFormat.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuReadCSVFileFormat.scala
index 3ddcec05061..8d9dd910ec7 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuReadCSVFileFormat.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuReadCSVFileFormat.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2020-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2020-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -55,7 +55,7 @@ class GpuReadCSVFileFormat extends CSVFileFormat with GpuReadFileFormatWithMetri
       sqlConf.sessionLocalTimeZone,
       sqlConf.columnNameOfCorruptRecord)
     val rapidsConf = new RapidsConf(sqlConf)
-    val factory = GpuCSVPartitionReaderFactory(
+    val factory = new GpuCSVPartitionReaderFactory(
       sqlConf,
       broadcastedHadoopConf,
       dataSchema,
@@ -80,7 +80,7 @@ class GpuReadCSVFileFormat extends CSVFileFormat with GpuReadFileFormatWithMetri
   }
 }
 
-object GpuReadCSVFileFormat {
+object GpuReadCSVFileFormat extends Serializable {
   def tagSupport(meta: SparkPlanMeta[FileSourceScanExec]): Unit = {
     val fsse = meta.wrapped
     GpuCSVScan.tagSupport(
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuReadOrcFileFormat.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuReadOrcFileFormat.scala
index 62a62a1400c..92574f7ac72 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuReadOrcFileFormat.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuReadOrcFileFormat.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2020-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2020-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -48,7 +48,7 @@ class GpuReadOrcFileFormat extends OrcFileFormat with GpuReadFileFormatWithMetri
     val sqlConf = sparkSession.sessionState.conf
     val broadcastedHadoopConf =
       sparkSession.sparkContext.broadcast(new SerializableConfiguration(hadoopConf))
-    val factory = GpuOrcPartitionReaderFactory(
+    val factory = new GpuOrcPartitionReaderFactory(
       sqlConf,
       broadcastedHadoopConf,
       dataSchema,
@@ -68,7 +68,7 @@ class GpuReadOrcFileFormat extends OrcFileFormat with GpuReadFileFormatWithMetri
       pushedFilters: Array[Filter],
       fileScan: GpuFileSourceScanExec): PartitionReaderFactory = {
     val poolConfBuilder = ThreadPoolConfBuilder(fileScan.rapidsConf)
-    GpuOrcMultiFilePartitionReaderFactory(
+    new GpuOrcMultiFilePartitionReaderFactory(
       fileScan.conf,
       broadcastedConf,
       fileScan.relation.dataSchema,
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuRowToColumnarExec.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuRowToColumnarExec.scala
index 8e61fa1c9b9..405571ba1ab 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuRowToColumnarExec.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuRowToColumnarExec.scala
@@ -23,7 +23,6 @@ import com.nvidia.spark.rapids.shims.{CudfUnsafeRow, GpuTypeShims, ShimUnaryExec
 
 import org.apache.spark.TaskContext
 import org.apache.spark.broadcast.Broadcast
-import org.apache.spark.internal.Logging
 import org.apache.spark.rdd.RDD
 import org.apache.spark.sql.catalyst.InternalRow
 import org.apache.spark.sql.catalyst.expressions.{Attribute, BoundReference, SortOrder, SpecializedGetters, UnsafeProjection, UnsafeRow}
@@ -107,22 +106,22 @@ object GpuRowToColumnConverter {
       // NOT SUPPORTED YET
       // case CalendarIntervalType => CalendarConverter
       case (at: ArrayType, true) =>
-        ArrayConverter(getConverterForType(at.elementType, at.containsNull))
+        new ArrayConverter(getConverterForType(at.elementType, at.containsNull))
       case (at: ArrayType, false) =>
-        NotNullArrayConverter(getConverterForType(at.elementType, at.containsNull))
+        new NotNullArrayConverter(getConverterForType(at.elementType, at.containsNull))
       case (st: StructType, true) =>
-        StructConverter(st.fields.map(getConverterFor))
+        new StructConverter(st.fields.map(getConverterFor))
       case (st: StructType, false) =>
-        NotNullStructConverter(st.fields.map(getConverterFor))
+        new NotNullStructConverter(st.fields.map(getConverterFor))
       case (dt: DecimalType, true) =>
         new DecimalConverter(dt.precision, dt.scale)
       case (dt: DecimalType, false) =>
         new NotNullDecimalConverter(dt.precision, dt.scale)
       case (MapType(k, v, vcn), true) =>
-        MapConverter(getConverterForType(k, nullable = false),
+        new MapConverter(getConverterForType(k, nullable = false),
           getConverterForType(v, vcn))
       case (MapType(k, v, vcn), false) =>
-        NotNullMapConverter(getConverterForType(k, nullable = false),
+        new NotNullMapConverter(getConverterForType(k, nullable = false),
           getConverterForType(v, vcn))
       case (NullType, _) =>
         // nullable=false appears only as a synthetic child of empty nested
@@ -404,7 +403,7 @@ object GpuRowToColumnConverter {
     ret + OFFSET
   }
 
-  private case class MapConverter(
+  private class MapConverter(
       keyConverter: TypeConverter,
       valueConverter: TypeConverter) extends TypeConverter {
     override def append(row: SpecializedGetters,
@@ -420,7 +419,7 @@ object GpuRowToColumnConverter {
     override def getNullSize: Double = OFFSET + VALIDITY
   }
 
-  private case class NotNullMapConverter(
+  private class NotNullMapConverter(
       keyConverter: TypeConverter,
       valueConverter: TypeConverter) extends TypeConverter {
     override def append(row: SpecializedGetters,
@@ -462,7 +461,7 @@ object GpuRowToColumnConverter {
     ret + OFFSET
   }
 
-  private case class ArrayConverter(childConverter: TypeConverter)
+  private class ArrayConverter(childConverter: TypeConverter)
       extends TypeConverter {
     override def append(row: SpecializedGetters,
         column: Int, builder: RapidsHostColumnBuilder): Double = {
@@ -477,7 +476,7 @@ object GpuRowToColumnConverter {
     override def getNullSize: Double = OFFSET + VALIDITY
   }
 
-  private case class NotNullArrayConverter(childConverter: TypeConverter)
+  private class NotNullArrayConverter(childConverter: TypeConverter)
       extends TypeConverter {
     override def append(row: SpecializedGetters,
         column: Int, builder: RapidsHostColumnBuilder): Double = {
@@ -501,7 +500,7 @@ object GpuRowToColumnConverter {
     ret
   }
 
-  private case class StructConverter(
+  private class StructConverter(
       childConverters: Array[TypeConverter]) extends TypeConverter {
     override def append(row: SpecializedGetters,
         column: Int,
@@ -518,7 +517,7 @@ object GpuRowToColumnConverter {
     override def getNullSize: Double = childConverters.map(_.getNullSize).sum + VALIDITY
   }
 
-  private case class NotNullStructConverter(
+  private class NotNullStructConverter(
       childConverters: Array[TypeConverter]) extends TypeConverter {
     override def append(row: SpecializedGetters,
         column: Int,
@@ -756,7 +755,17 @@ class RowToColumnarIterator(
 
 }
 
-object GeneratedInternalRowToCudfRowIterator extends Logging {
+object GeneratedInternalRowToCudfRowIterator {
+  // Strip the trailing "$" of the Scala object class so the logger is named after the
+  // object itself, consistent with the other loggers that replace Spark's Logging trait.
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+
+  private def logDebug(msg: => String): Unit = {
+    if (log.isDebugEnabled) {
+      log.debug(msg)
+    }
+  }
+
   def apply(input: Iterator[InternalRow],
       schema: Array[Attribute],
       goal: CoalesceSizeGoal,
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuRunnableCommandExec.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuRunnableCommandExec.scala
index 644acd19fbb..2817d7c710f 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuRunnableCommandExec.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuRunnableCommandExec.scala
@@ -112,7 +112,7 @@ case class GpuRunnableCommandExec(cmd: GpuRunnableCommand, child: SparkPlan)
   override lazy val allMetrics: Map[String, GpuMetric] = GpuMetric.wrap(cmd.metrics)
 
   private lazy val sideEffectResult: Seq[ColumnarBatch] =
-    cmd.runColumnar(sparkSession, child)
+    cmd.runColumnar(sparkSession.asInstanceOf[GpuSparkSession], child)
 
   override def output: Seq[Attribute] = cmd.output
 
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuSemaphore.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuSemaphore.scala
index a51aa1c1de7..fd15ed1e858 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuSemaphore.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuSemaphore.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2019-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2019-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -29,7 +29,6 @@ import com.nvidia.spark.rapids.jni.{RmmSpark, TaskPriority}
 import com.nvidia.spark.rapids.metrics.GpuBubbleTimerManager
 
 import org.apache.spark.TaskContext
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.internal.SQLConf
 import org.apache.spark.sql.rapids.GpuTaskMetrics
 
@@ -49,18 +48,13 @@ case object SemaphoreAcquired extends TryAcquireResult
  * @param numWaitingTasks the number of tasks waiting at the time the request was made.
  *                        Note that this can change very quickly.
  */
-case class AcquireFailed(numWaitingTasks: Int) extends TryAcquireResult
-
-private object GpuTaskMemoryEstimator {
-  private val TIME_WINDOW: Double = TimeUnit.MILLISECONDS.toNanos(100).toDouble
-}
+class AcquireFailed(val numWaitingTasks: Int) extends TryAcquireResult with Serializable
 
 class GpuTaskMemoryEstimator(val stageId: Int,
                              val taskId: Long,
                              val defaultEstimate: Long,
                              val allowDynamicUpdate: Boolean) {
-  import GpuTaskMemoryEstimator._
-
+  private val TIME_WINDOW: Double = TimeUnit.MILLISECONDS.toNanos(100).toDouble
   private val startTimeNanos: Long = System.nanoTime()
   private var totalTimeLost: Long = 0
   private var maxMemory: Long = 0
@@ -318,7 +312,7 @@ object GpuSemaphore {
  */
 private final class SemaphoreTaskInfo(val stageId: Int, val taskAttemptId: Long,
                                       memoryEstimator: GpuStageMemoryEstimator,
-                                      bubbleTimerMgr: GpuBubbleTimerManager) extends Logging {
+                                      bubbleTimerMgr: GpuBubbleTimerManager) {
   /**
    * This holds threads that are not on the GPU yet. Most of the time they are
    * blocked waiting for the semaphore to let them on, but it may hold one
@@ -509,7 +503,23 @@ private final class SemaphoreTaskInfo(val stageId: Int, val taskAttemptId: Long,
   }
 }
 
-private final class GpuSemaphore(val maxConcurrentGpuTasksLimit: Int) extends Logging {
+private final class GpuSemaphore(val maxConcurrentGpuTasksLimit: Int) {
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+
+  // The helpers below take the message by name and check the level first, so the
+  // message string is only built when it is actually going to be logged.
+  private def logDebug(msg: => String): Unit = {
+    if (log.isDebugEnabled) log.debug(msg)
+  }
+
+  private def logWarning(msg: => String): Unit = {
+    if (log.isWarnEnabled) log.warn(msg)
+  }
+
+  private def logWarning(msg: => String, throwable: Throwable): Unit = {
+    if (log.isWarnEnabled) log.warn(msg, throwable)
+  }
+
 
   import GpuSemaphore._
 
@@ -572,7 +582,7 @@ private final class GpuSemaphore(val maxConcurrentGpuTasksLimit: Int) extends Lo
           numWaiting += 1
         }
       }
-      AcquireFailed(numWaiting)
+      new AcquireFailed(numWaiting)
     }
   }
 
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuShuffleCoalesceExec.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuShuffleCoalesceExec.scala
index ac12baea358..851345b3dfe 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuShuffleCoalesceExec.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuShuffleCoalesceExec.scala
@@ -38,7 +38,6 @@ import com.nvidia.spark.rapids.shims.ShimUnaryExecNode
 import org.apache.hadoop.conf.Configuration
 
 import org.apache.spark.TaskContext
-import org.apache.spark.internal.Logging
 import org.apache.spark.rdd.RDD
 import org.apache.spark.sql.catalyst.InternalRow
 import org.apache.spark.sql.catalyst.expressions.Attribute
@@ -113,7 +112,13 @@ case class CoalesceReadOption private(
     kudoEnabled: Boolean, kudoMode: RapidsConf.ShuffleKudoMode.Value, kudoDebugMode: DumpOption,
     kudoDebugDumpPrefix: Option[String], useAsync: Boolean)
 
-object CoalesceReadOption extends Logging {
+object CoalesceReadOption {
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+
+  // `msg` is by-name: check the level first so it is only built when WARN is enabled.
+  private def logWarning(msg: => String): Unit =
+    if (log.isWarnEnabled) log.warn(msg)
+
 
   private def resolveUseAsync(kudoMode: RapidsConf.ShuffleKudoMode.Value,
       useAsync: Boolean): Boolean = {
@@ -190,10 +195,10 @@ object GpuShuffleCoalesceUtils {
       val secondHalfSize = newTargetSize.dataSize - firstHalfSize
 
       Seq(
-        CloseableTableSeqWithTargetSize(firstHalfTables,
-          AutoCloseableTargetSize(targetByteSize, newTargetSize.minSize, firstHalfSize)),
-        CloseableTableSeqWithTargetSize(secondHalfTables,
-          AutoCloseableTargetSize(targetByteSize, newTargetSize.minSize, secondHalfSize))
+        new CloseableTableSeqWithTargetSize(firstHalfTables,
+          new AutoCloseableTargetSize(targetByteSize, newTargetSize.minSize, firstHalfSize)),
+        new CloseableTableSeqWithTargetSize(secondHalfTables,
+          new AutoCloseableTargetSize(targetByteSize, newTargetSize.minSize, secondHalfSize))
       )
     }
   }
@@ -339,7 +344,7 @@ class JCudfTableOperator
   }
 }
 
-case class RowCountOnlyMergeResult(rowCount: Int) extends CoalescedHostResult {
+class RowCountOnlyMergeResult(val rowCount: Int) extends CoalescedHostResult {
   override def toGpuBatch(dataTypes: Array[DataType]): ColumnarBatch = {
     new ColumnarBatch(Array.empty, rowCount)
   }
@@ -367,8 +372,8 @@ class KudoTableOperator(kudo: Option[KudoSerializer], readOption: CoalesceReadOp
     val dumpPrefix = readOption.kudoDebugDumpPrefix
     if (dumpOption != DumpOption.Never && dumpPrefix.isDefined) {
       val updatedPrefix = s"${dumpPrefix.get}_${taskIdentifier}"
-      lazy val (out, path) = createTempFile(new Configuration(), updatedPrefix, ".bin")
-      new MergeOptions(dumpOption, () => out, path.toString)
+      lazy val tempFile = createTempFile(new Configuration(), updatedPrefix, ".bin")
+      new MergeOptions(dumpOption, () => tempFile.getOutputStream, tempFile.getPath.toString)
     } else {
       new MergeOptions(dumpOption, null, null)
     }
@@ -379,7 +384,7 @@ class KudoTableOperator(kudo: Option[KudoSerializer], readOption: CoalesceReadOp
     val numCols = columns.head.spillableKudoTable.header.getNumColumns
     if (numCols == 0) {
       val totalRowsNum = columns.map(getNumRows).sum
-      RowCountOnlyMergeResult(totalRowsNum)
+      new RowCountOnlyMergeResult(totalRowsNum)
     } else {
       // "lock" all input tables in memory before merge
       withResource(columns.safeMap(_.spillableKudoTable.makeKudoTable)) { kudoTables =>
@@ -455,9 +460,9 @@ class KudoGpuTableOperator(dataTypes: Array[DataType])
  * splitting based on byte size when OOM occurs. Extends Seq[T] so it can be
  * used directly as a sequence.
  */
-case class CloseableTableSeqWithTargetSize[T <: AutoCloseable](
-    tables: Seq[T],
-    targetSize: AutoCloseableTargetSize) extends Seq[T] with AutoCloseable {
+class CloseableTableSeqWithTargetSize[T <: AutoCloseable](
+    val tables: Seq[T],
+    val targetSize: AutoCloseableTargetSize) extends Seq[T] with AutoCloseable with Serializable {
   override def close(): Unit = {
     tables.foreach(_.safeClose())
     targetSize.close()
@@ -548,9 +553,9 @@ abstract class CoalesceIteratorBase[T <: AutoCloseable : ClassTag, R <: AutoClos
       splitPolicy match {
         case Some(policy) =>
           val dataSize = tablesSeq.map(tableOperator.getDataLen).sum
-          val targetSizeWrapper = AutoCloseableTargetSize(targetBatchByteSize,
+          val targetSizeWrapper = new AutoCloseableTargetSize(targetBatchByteSize,
             minSplitSizeForRetry, dataSize)
-          val wrapper = CloseableTableSeqWithTargetSize(tablesSeq, targetSizeWrapper)
+          val wrapper = new CloseableTableSeqWithTargetSize(tablesSeq, targetSizeWrapper)
           val wrapperIter = Iterator(wrapper)
           inputIter = Some(wrapperIter)
           val resultIter = withRetry(wrapperIter, policy) { wrappedSeq =>
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuShuffledHashJoinExec.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuShuffledHashJoinExec.scala
index e289ad3774b..a4c58f7fe29 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuShuffledHashJoinExec.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuShuffledHashJoinExec.scala
@@ -24,7 +24,6 @@ import com.nvidia.spark.rapids.RmmRapidsRetryIterator.withRetryNoSplit
 import com.nvidia.spark.rapids.shims.{GpuHashPartitioning, ShimBinaryExecNode}
 
 import org.apache.spark.TaskContext
-import org.apache.spark.internal.Logging
 import org.apache.spark.rdd.RDD
 import org.apache.spark.sql.catalyst.InternalRow
 import org.apache.spark.sql.catalyst.expressions.{Attribute, Expression}
@@ -282,7 +281,12 @@ case class GpuShuffledHashJoinExec(
   }
 }
 
-object GpuShuffledHashJoinExec extends Logging {
+object GpuShuffledHashJoinExec {
+  // Logger is named after the object without the trailing "$" of its JVM class name.
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+
+  private def logDebug(msg: => String): Unit = if (log.isDebugEnabled) log.debug(msg)
+
   /**
    * Return the build data as a single ColumnarBatch when sub-partitioning is not enabled,
    * while as an iterator of ColumnarBatch when sub-partitioning is enabled.
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuShuffledSizedHashJoinExec.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuShuffledSizedHashJoinExec.scala
index abc718d83f5..c48901b2d0a 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuShuffledSizedHashJoinExec.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuShuffledSizedHashJoinExec.scala
@@ -156,14 +156,14 @@ object GpuShuffledSizedHashJoinExec {
   }
 
   /** Utility class to track information related to a join. */
-  case class JoinInfo(
-      joinType: JoinType,
-      buildSide: GpuBuildSide,
-      buildIter: Iterator[ColumnarBatch],
-      buildSize: Long,
-      buildStats: Option[JoinBuildSideStats],
-      streamIter: Iterator[ColumnarBatch],
-      exprs: BoundJoinExprs)
+  class JoinInfo(
+      val joinType: JoinType,
+      val buildSide: GpuBuildSide,
+      val buildIter: Iterator[ColumnarBatch],
+      val buildSize: Long,
+      val buildStats: Option[JoinBuildSideStats],
+      val streamIter: Iterator[ColumnarBatch],
+      val exprs: BoundJoinExprs)
 
   /**
    * Trait to house common code for determining the ideal build/stream
@@ -750,7 +750,7 @@ object GpuShuffledSymmetricHashJoinExec {
           val streamIter = new CollectTimeIterator(NvtxRegistry.FETCH_JOIN_STREAM,
             setupForJoin(streamQueue, rawStreamIter, exprs.streamTypes, gpuBatchSizeBytes, metrics),
             streamTime)
-          JoinInfo(joinType, buildSide, buildIter, buildSize, None, streamIter, exprs)
+          new JoinInfo(joinType, buildSide, buildIter, buildSize, None, streamIter, exprs)
         }
       }
     }
@@ -889,12 +889,12 @@ object GpuShuffledAsymmetricHashJoinExec {
         if (streamRows <= Int.MaxValue && streamSize <= gpuBatchSizeBytes) {
           metrics(BUILD_DATA_SIZE).set(streamSize)
           val flippedSide = flipped(buildSide)
-          JoinInfo(joinType, flippedSide, streamIter, streamSize, None, baseBuildIter,
+          new JoinInfo(joinType, flippedSide, streamIter, streamSize, None, baseBuildIter,
             exprs.flipped(joinType, flippedSide, condition, leftOutput, rightOutput, metrics))
         } else {
           val buildIter = addNullFilterIfNecessary(baseBuildIter, exprs.boundBuildKeys,
             exprs.buildSideNeedsNullFilter, metrics)
-          JoinInfo(joinType, buildSide, buildIter, buildSize, None, streamIter, exprs)
+          new JoinInfo(joinType, buildSide, buildIter, buildSize, None, streamIter, exprs)
         }
       }
     }
@@ -923,14 +923,14 @@ object GpuShuffledAsymmetricHashJoinExec {
         metrics(BUILD_DATA_SIZE).set(buildSize)
         val buildIter = addNullFilterIfNecessary(baseBuildIter, exprs.boundBuildKeys,
           exprs.buildSideNeedsNullFilter, metrics)
-        JoinInfo(joinType, buildSide, buildIter, buildSize, None, streamIter, exprs)
+        new JoinInfo(joinType, buildSide, buildIter, buildSize, None, streamIter, exprs)
       } else {
         val buildBatch = getAsSingleBuildBatch(baseBuildIter, exprs, metrics)
         val buildIter = new SingleGpuColumnarBatchIterator(buildBatch)
         val buildStats = JoinBuildSideStats.fromBatch(buildBatch, exprs.boundBuildKeys)
         if (buildStats.streamMagnificationFactor < magnificationThreshold) {
           metrics(BUILD_DATA_SIZE).set(buildSize)
-          JoinInfo(joinType, buildSide, buildIter, buildSize, Some(buildStats), streamIter,
+          new JoinInfo(joinType, buildSide, buildIter, buildSize, Some(buildStats), streamIter,
             exprs)
         } else {
           // The natural build side is explosive, so check the natural stream side to see
@@ -962,25 +962,26 @@ object GpuShuffledAsymmetricHashJoinExec {
                 if (buildStats.streamMagnificationFactor <
                     streamStats.streamMagnificationFactor) {
                   metrics(BUILD_DATA_SIZE).set(buildSize)
-                  JoinInfo(joinType, buildSide, buildIter, buildSize, Some(buildStats),
+                  new JoinInfo(joinType, buildSide, buildIter, buildSize, Some(buildStats),
                     singleStreamIter, exprs)
                 } else {
                   metrics(BUILD_DATA_SIZE).set(streamSize)
                   val flippedSide = flipped(buildSide)
-                  JoinInfo(joinType, flippedSide, singleStreamIter, streamSize, Some(streamStats),
+                  new JoinInfo(
+                    joinType, flippedSide, singleStreamIter, streamSize, Some(streamStats),
                     buildIter, exprs.flipped(joinType, flippedSide, condition,
                       leftOutput, rightOutput, metrics))
                 }
               } else {
                 metrics(BUILD_DATA_SIZE).set(streamSize)
                 val flippedSide = flipped(buildSide)
-                JoinInfo(joinType, flippedSide, streamBatchIter, streamSize, None,
+                new JoinInfo(joinType, flippedSide, streamBatchIter, streamSize, None,
                   buildIter, exprs.flipped(joinType, flippedSide, condition,
                     leftOutput, rightOutput, metrics))
               }
             } else {
               metrics(BUILD_DATA_SIZE).set(buildSize)
-              JoinInfo(joinType, buildSide, buildIter, buildSize, Some(buildStats),
+              new JoinInfo(joinType, buildSide, buildIter, buildSize, Some(buildStats),
                 new SpillableColumnarBatchQueueIterator(streamQueue, streamIter), exprs)
             }
           }
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuSortExec.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuSortExec.scala
index 9a79151d3cf..828fb32b72e 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuSortExec.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuSortExec.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2019-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2019-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -36,7 +36,7 @@ import org.apache.spark.sql.catalyst.plans.physical.{Distribution, OrderedDistri
 import org.apache.spark.sql.execution.{SortExec, SparkPlan}
 import org.apache.spark.sql.internal.SQLConf
 import org.apache.spark.sql.rapids.{GpuWriteJobStatsTracker, GpuWriteTaskStatsTracker}
-import org.apache.spark.sql.rapids.execution.TrampolineUtil
+import org.apache.spark.sql.rapids.shims.DataTypeUtilsShim
 import org.apache.spark.sql.vectorized.ColumnarBatch
 
 sealed trait SortExecType extends Serializable
@@ -141,12 +141,12 @@ case class GpuSortExec(
         tcs.map(_.newTaskInstance().asInstanceOf[GpuWriteTaskStatsTracker])
       }
       val finalIter = if (outOfCore) {
-        val iter = GpuOutOfCoreSortIterator(cbIter, sorter,
+        val iter = new GpuOutOfCoreSortIterator(cbIter, sorter,
           targetSize, opTime, sortTime, outputBatch, outputRows)
         onTaskCompletion(iter.close())
         iter
       } else {
-        GpuSortEachBatchIterator(cbIter, sorter, singleBatch,
+        new GpuSortEachBatchIterator(cbIter, sorter, singleBatch,
           opTime, sortTime, outputBatch, outputRows)
       }
       if (taskTrackers.exists(_.nonEmpty)) {
@@ -165,14 +165,14 @@ case class GpuSortExec(
   }
 }
 
-case class GpuSortEachBatchIterator(
-    iter: Iterator[ColumnarBatch],
-    sorter: GpuSorter,
-    singleBatch: Boolean,
-    opTime: GpuMetric = NoopMetric,
-    sortTime: GpuMetric = NoopMetric,
-    outputBatches: GpuMetric = NoopMetric,
-    outputRows: GpuMetric = NoopMetric) extends Iterator[ColumnarBatch] {
+class GpuSortEachBatchIterator(
+    val iter: Iterator[ColumnarBatch],
+    val sorter: GpuSorter,
+    val singleBatch: Boolean,
+    val opTime: GpuMetric,
+    val sortTime: GpuMetric,
+    val outputBatches: GpuMetric,
+    val outputRows: GpuMetric) extends Iterator[ColumnarBatch] with Serializable {
   override def hasNext: Boolean = iter.hasNext
 
   override def next(): ColumnarBatch = {
@@ -238,8 +238,8 @@ object GpuSpillableProjectedSortEachBatchIterator {
  * Holds data for the out of core sort. It includes the batch of data and the first row in that
  * batch so we can sort the batches.
  */
-case class OutOfCoreBatch(buffer: SpillableColumnarBatch,
-    firstRow: UnsafeRow) extends AutoCloseable {
+class OutOfCoreBatch(val buffer: SpillableColumnarBatch,
+    val firstRow: UnsafeRow) extends AutoCloseable {
   override def close(): Unit = buffer.close()
 }
 
@@ -295,15 +295,15 @@ class Pending(cpuOrd: LazilyGeneratedOrdering) extends AutoCloseable {
  * the merged data is split and put back into a pending queue.  The process repeats until we have
  * enough data to output.
  */
-case class GpuOutOfCoreSortIterator(
-    iter: Iterator[ColumnarBatch],
-    sorter: GpuSorter,
-    targetSize: Long,
-    opTime: GpuMetric,
-    sortTime: GpuMetric,
-    outputBatches: GpuMetric,
-    outputRows: GpuMetric) extends Iterator[ColumnarBatch]
-    with AutoCloseable {
+class GpuOutOfCoreSortIterator(
+    val iter: Iterator[ColumnarBatch],
+    val sorter: GpuSorter,
+    val targetSize: Long,
+    val opTime: GpuMetric,
+    val sortTime: GpuMetric,
+    val outputBatches: GpuMetric,
+    val outputRows: GpuMetric) extends Iterator[ColumnarBatch]
+    with AutoCloseable with Serializable {
 
   /**
    * This has already sorted the data, and it still has the projected columns in it that need to
@@ -328,7 +328,7 @@ case class GpuOutOfCoreSortIterator(
   // Used for converting between rows and columns when we have to put a cuttoff on the GPU
   // to know how much of the data after a merge sort is fully sorted.
   private lazy val converters = new GpuRowToColumnConverter(
-    TrampolineUtil.fromAttributes(sorter.projectedBatchSchema))
+    DataTypeUtilsShim.fromAttributes(sorter.projectedBatchSchema))
 
   /**
    * Convert the boundaries (first rows for each batch) into unsafe rows for use later on.
@@ -434,7 +434,7 @@ case class GpuOutOfCoreSortIterator(
                 if (ct.getRowCount > 0) {
                   val sp = SpillableColumnarBatch(ct, sorter.projectedBatchTypes,
                     SpillPriorities.ACTIVE_ON_DECK_PRIORITY)
-                  pendingObs += OutOfCoreBatch(sp, lower)
+                  pendingObs += new OutOfCoreBatch(sp, lower)
                 } else {
                   ct.close()
                 }
@@ -517,7 +517,7 @@ case class GpuOutOfCoreSortIterator(
           val cutoff = pending.peek().firstRow
           val result = RmmRapidsRetryIterator.withRetryNoSplit[ColumnVector] {
             withResource(converters.convertBatch(Array(cutoff),
-              TrampolineUtil.fromAttributes(sorter.projectedBatchSchema))) { cutoffCb =>
+              DataTypeUtilsShim.fromAttributes(sorter.projectedBatchSchema))) { cutoffCb =>
               withResource(mergedSpillBatch.getColumnarBatch()) { mergedBatch =>
                 sorter.upperBound(mergedBatch, cutoffCb)
               }
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuUserDefinedFunction.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuUserDefinedFunction.scala
index eae23b86dd5..b03d082f1c9 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuUserDefinedFunction.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/GpuUserDefinedFunction.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2021-2024, NVIDIA CORPORATION.
+ * Copyright (c) 2021-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -23,7 +23,6 @@ import com.nvidia.spark.rapids.RapidsPluginImplicits._
 import com.nvidia.spark.rapids.shims.ShimExpression
 
 import org.apache.spark.SparkException
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.catalyst.InternalRow
 import org.apache.spark.sql.catalyst.expressions.{GenericInternalRow, UserDefinedExpression}
 import org.apache.spark.sql.rapids.execution.TrampolineUtil
@@ -91,7 +90,13 @@ object GpuUserDefinedFunction {
  * and do the processing on CPU.
  */
 trait GpuRowBasedUserDefinedFunction extends GpuExpression
-    with ShimExpression with UserDefinedExpression with Serializable with Logging {
+    with ShimExpression with UserDefinedExpression with Serializable {
+  // Logger is named after the concrete runtime class rather than this trait.
+  @transient private lazy val log = org.slf4j.LoggerFactory.getLogger(
+    getClass.getName.stripSuffix("$"))
+
+  private def logDebug(msg: => String): Unit = if (log.isDebugEnabled) log.debug(msg)
+
   /** name of the UDF function */
   val name: String
 
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/HashExprMetas.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/HashExprMetas.scala
index cd8bc87f032..98b191b32f7 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/HashExprMetas.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/HashExprMetas.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2025, NVIDIA CORPORATION.
+ * Copyright (c) 2025-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -24,7 +24,7 @@ import org.apache.spark.sql.rapids.execution.TrampolineUtil
 import org.apache.spark.sql.types.{ArrayType, StructType}
 
 /** Base meta for Murmur3-hash-like expressions. */
-case class Murmur3HashExprMeta[HEINT <: HashExpression[Int]](
+class Murmur3HashExprMeta[HEINT <: HashExpression[Int]](
     expr: HEINT,
     override val conf: RapidsConf,
     override val parent: Option[RapidsMeta[_, _, _]],
@@ -47,7 +47,7 @@ case class Murmur3HashExprMeta[HEINT <: HashExpression[Int]](
 }
 
 /** Base meta for xxhash64-like expressions. */
-case class XxHash64ExprMeta[HE <: HashExpression[Long]](
+class XxHash64ExprMeta[HE <: HashExpression[Long]](
     expr: HE,
     override val conf: RapidsConf,
     override val parent: Option[RapidsMeta[_, _, _]],
@@ -83,14 +83,14 @@ object HashExprChecks {
 
   val murmur3ProjectChecks: ExprChecks = ExprChecks.projectOnly(
     TypeSig.INT, TypeSig.INT,
-    repeatingParamCheck = Some(RepeatingParamCheck(
+    repeatingParamCheck = Some(new RepeatingParamCheck(
       "input",
       murmur3InputTypes,
       TypeSig.all)))
 
   val xxhash64ProjectChecks: ExprChecks = ExprChecks.projectOnly(
     TypeSig.LONG, TypeSig.LONG,
-    repeatingParamCheck = Some(RepeatingParamCheck(
+    repeatingParamCheck = Some(new RepeatingParamCheck(
       "input",
       XxHash64Shims.supportedTypes,
       TypeSig.all)))
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/HostAlloc.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/HostAlloc.scala
index 8086d75c253..1503e291272 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/HostAlloc.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/HostAlloc.scala
@@ -28,12 +28,22 @@ import com.nvidia.spark.rapids.jni.{CpuRetryOOM, RmmSpark}
 import com.nvidia.spark.rapids.spill.SpillFramework
 
 import org.apache.spark.TaskContext
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.rapids.GpuTaskMetrics
 
-case class HostAllocResult(buffer: HostMemoryBuffer, isPinned: Boolean)
 
-private class HostAlloc(nonPinnedLimit: Long) extends HostMemoryAllocator with Logging {
+private class HostAlloc(nonPinnedLimit: Long) extends HostMemoryAllocator {
+  private def logTrace(msg: => String): Unit = {
+    HostAlloc.logTrace(msg)
+  }
+
+  private def logInfo(msg: => String): Unit = {
+    HostAlloc.logInfo(msg)
+  }
+
+  private def logWarning(msg: => String): Unit = {
+    HostAlloc.logWarning(msg)
+  }
+
   private var currentNonPinnedAllocated: Long = 0L
   private val pinnedLimit: Long = PinnedMemoryPool.getTotalPoolSizeBytes
   // For now we are going to assume that we are the only ones calling into the pinned pool
@@ -205,14 +215,14 @@ private class HostAlloc(nonPinnedLimit: Long) extends HostMemoryAllocator with L
       do {
         ret = (
           if (preferPinned) {
-            tryAllocPinned(amount).map(HostAllocResult(_, isPinned = true))
+            tryAllocPinned(amount).map(buffer => new HostAllocResult(buffer, true))
           } else {
-            tryAllocNonPinned(amount).map(HostAllocResult(_, isPinned = false))
+            tryAllocNonPinned(amount).map(buffer => new HostAllocResult(buffer, false))
           }).orElse {
           if (preferPinned) {
-            tryAllocNonPinned(amount).map(HostAllocResult(_, isPinned = false))
+            tryAllocNonPinned(amount).map(buffer => new HostAllocResult(buffer, false))
           } else {
-            tryAllocPinned(amount).map(HostAllocResult(_, isPinned = true))
+            tryAllocPinned(amount).map(buffer => new HostAllocResult(buffer, true))
           }
         }
         if (ret.isEmpty) {
@@ -226,7 +236,9 @@ private class HostAlloc(nonPinnedLimit: Long) extends HostMemoryAllocator with L
       allocAttemptFinishedWithoutException = true
     } finally {
       ret match {
-        case Some(HostAllocResult(buffer: HostMemoryBuffer, isPinned: Boolean)) =>
+        case Some(result) =>
+          val buffer = result.buffer
+          val isPinned = result.isPinned
           val metrics = GpuTaskMetrics.get
           metrics.incHostBytesAllocated(amount, isPinned)
           if (BOOKKEEP_MEMORY) {
@@ -287,7 +299,25 @@ private class HostAlloc(nonPinnedLimit: Long) extends HostMemoryAllocator with L
 /**
  * A new API for host memory allocation. This can be used to limit the amount of host memory.
  */
-object HostAlloc extends Logging {
+object HostAlloc {
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+
+  private def logTrace(msg: => String): Unit = {
+    if (log.isTraceEnabled) {
+      log.trace(msg)
+    }
+  }
+
+  private def logInfo(msg: => String): Unit = {
+    if (log.isInfoEnabled) {
+      log.info(msg)
+    }
+  }
+
+  private def logWarning(msg: => String): Unit = {
+    if (log.isWarnEnabled) log.warn(msg) // build the by-name msg only when WARN is enabled
+  }
+
   private var singleton: HostAlloc = new HostAlloc(-1)
 
   private def getSingleton: HostAlloc = synchronized {
@@ -334,7 +364,7 @@ object HostAlloc extends Logging {
     buff.synchronized {
       val previous = Option(buff.getEventHandler)
       val handlerToSet = previous.map { p =>
-        MultiEventHandler(p, handler)
+        new MultiEventHandler(p, handler)
       }.getOrElse {
         handler
       }
@@ -354,7 +384,7 @@ object HostAlloc extends Logging {
       case oldA: MultiEventHandler =>
         // From how the MultiEventHandler is set up we know that b cannot be one
         val newA = removeEventHandlerFrom(oldA, handler)
-        MultiEventHandler(newA, multiEventHandler.b)
+        new MultiEventHandler(newA, multiEventHandler.b)
       case _ =>
         multiEventHandler
     }
@@ -390,8 +420,8 @@ object HostAlloc extends Logging {
     }
   }
 
-  private case class MultiEventHandler(a: MemoryBuffer.EventHandler,
-                                       b: MemoryBuffer.EventHandler)
+  private class MultiEventHandler(val a: MemoryBuffer.EventHandler,
+                                  val b: MemoryBuffer.EventHandler)
     extends MemoryBuffer.EventHandler {
     override def onClosed(i: Int): Unit = {
       var t: Option[Throwable] = None
@@ -434,7 +464,7 @@ object HostAlloc extends Logging {
     }
     override def remove(addr: Long, amount: Long): Unit = totalMem.add(-amount)
   }
-  private case class MemoryUsageDetail(addr: Long, amount: Long, callStack: String) {
+  private class MemoryUsageDetail(val addr: Long, val amount: Long, val callStack: String) {
     override def toString: String = s"$amount bytes behind address $addr at $callStack"
   }
 
@@ -445,7 +475,7 @@ object HostAlloc extends Logging {
         s"${details.values.mkString("\n")}"
 
     override def add(addr: Long, amount: Long, callstack: String): Unit =
-      details.put(addr, MemoryUsageDetail(addr, amount, callstack))
+      details.put(addr, new MemoryUsageDetail(addr, amount, callstack))
 
     override def remove(addr: Long, amount: Long): Unit =
       details.remove(addr)
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/HostColumnarToGpu.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/HostColumnarToGpu.scala
index ac4ea77c893..15a20deb01e 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/HostColumnarToGpu.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/HostColumnarToGpu.scala
@@ -28,7 +28,6 @@ import org.apache.arrow.memory.{ArrowBuf, ReferenceManager}
 import org.apache.arrow.vector.ValueVector
 
 import org.apache.spark.TaskContext
-import org.apache.spark.internal.Logging
 import org.apache.spark.rdd.RDD
 import org.apache.spark.sql.catalyst.InternalRow
 import org.apache.spark.sql.catalyst.expressions.Attribute
@@ -38,7 +37,7 @@ import org.apache.spark.sql.types._
 import org.apache.spark.sql.vectorized.{ArrowColumnVector, ColumnarBatch, ColumnVector}
 import org.apache.spark.sql.vectorized.rapids.AccessibleArrowColumnVector
 
-object HostColumnarToGpu extends Logging {
+object HostColumnarToGpu {
 
   // use reflection to get access to a private field in a class
   private def getClassFieldAccessible(className: String, fieldName: String) = {
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/HostMemoryStreams.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/HostMemoryStreams.scala
index 4be11b13254..2685f11a367 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/HostMemoryStreams.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/HostMemoryStreams.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2019-2023, NVIDIA CORPORATION.
+ * Copyright (c) 2019-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -16,97 +16,11 @@
 
 package com.nvidia.spark.rapids
 
-import java.io.{EOFException, InputStream, IOException, OutputStream}
+import java.io.{InputStream, IOException}
 import java.nio.ByteBuffer
-import java.nio.channels.ReadableByteChannel
 
 import ai.rapids.cudf.HostMemoryBuffer
 
-/**
- * An implementation of OutputStream that writes to a HostMemoryBuffer.
- *
- * NOTE: Closing this output stream does NOT close the buffer!
- *
- * @param buffer the buffer to receive written data
- */
-class HostMemoryOutputStream(val buffer: HostMemoryBuffer) extends OutputStream {
-  protected var pos: Long = 0
-
-  override def write(i: Int): Unit = {
-    buffer.setByte(pos, i.toByte)
-    pos += 1
-  }
-
-  override def write(bytes: Array[Byte]): Unit = {
-    buffer.setBytes(pos, bytes, 0, bytes.length)
-    pos += bytes.length
-  }
-
-  override def write(bytes: Array[Byte], offset: Int, len: Int): Unit = {
-    buffer.setBytes(pos, bytes, offset, len)
-    pos += len
-  }
-
-  def write(data: ByteBuffer): Unit = {
-    val numBytes = data.remaining()
-    val outBuffer = buffer.asByteBuffer(pos, numBytes)
-    outBuffer.put(data)
-    pos += numBytes
-  }
-
-  def writeAsByteBuffer(length: Int): ByteBuffer = {
-    val bb = buffer.asByteBuffer(pos, length)
-    pos += length
-    bb
-  }
-
-  def getPos: Long = pos
-
-  def seek(newPos: Long): Unit = {
-    pos = newPos
-  }
-
-  def copyFromChannel(channel: ReadableByteChannel, length: Long): Unit = {
-    val endPos = pos + length
-    assert(endPos <= buffer.getLength)
-    while (pos != endPos) {
-      val bytesToCopy = (endPos - pos).min(Integer.MAX_VALUE).toInt
-      val bytebuf = buffer.asByteBuffer(pos, bytesToCopy)
-      while (bytebuf.hasRemaining) {
-        val channelReadBytes = channel.read(bytebuf)
-        if (channelReadBytes < 0) {
-          throw new EOFException("Unexpected EOF while reading from byte channel")
-        }
-      }
-      pos += bytesToCopy
-    }
-  }
-}
-
-/** A HostMemoryOutputStream only counts the written bytes, nothing is actually written. */
-final class NullHostMemoryOutputStream extends HostMemoryOutputStream(null) {
-  override def write(i: Int): Unit = {
-    pos += 1
-  }
-
-  override def write(bytes: Array[Byte]): Unit = {
-    pos += bytes.length
-  }
-
-  override def write(bytes: Array[Byte], offset: Int, len: Int): Unit = {
-    pos += len
-  }
-
-  override def copyFromChannel(channel: ReadableByteChannel, length: Long): Unit = {
-    val endPos = pos + length
-    while (pos != endPos) {
-      val bytesToCopy = (endPos - pos).min(Integer.MAX_VALUE)
-      pos += bytesToCopy
-    }
-  }
-
-}
-
 trait HostMemoryInputStreamMixIn extends InputStream {
   protected val hmb: HostMemoryBuffer
   protected val hmbLength: Long
@@ -167,16 +81,3 @@ trait HostMemoryInputStreamMixIn extends InputStream {
 
   def getPos: Long = pos
 }
-
-/**
- * An implementation of InputStream that reads from a HostMemoryBuffer.
- *
- * NOTE: Closing this input stream does NOT close the buffer!
- *
- * @param hmb the buffer from which to read data
- * @param hmbLength the amount of data available in the buffer
- */
-class HostMemoryInputStream(
-    val hmb: HostMemoryBuffer,
-    val hmbLength: Long) extends HostMemoryInputStreamMixIn {
-}
\ No newline at end of file
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/InternalExclusiveModeGpuDiscoveryPlugin.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/InternalExclusiveModeGpuDiscoveryPlugin.scala
index 8f5b5ee66b9..b43c6dee487 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/InternalExclusiveModeGpuDiscoveryPlugin.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/InternalExclusiveModeGpuDiscoveryPlugin.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2021, NVIDIA CORPORATION.
+ * Copyright (c) 2021-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -24,7 +24,6 @@ import ai.rapids.cudf.Cuda
 
 import org.apache.spark.SparkConf
 import org.apache.spark.api.resource.ResourceDiscoveryPlugin
-import org.apache.spark.internal.Logging
 import org.apache.spark.resource.{ResourceInformation, ResourceRequest}
 
 /**
@@ -32,7 +31,23 @@ import org.apache.spark.resource.{ResourceInformation, ResourceRequest}
  * It should be loaded by reflection using ShimLoader.newInstanceOf, see ./docs/dev/shims.md
  */
 protected class InternalExclusiveModeGpuDiscoveryPlugin
-  extends ResourceDiscoveryPlugin with Logging {
+  extends ResourceDiscoveryPlugin {
+
+  private val log = org.slf4j.LoggerFactory.getLogger(
+    classOf[InternalExclusiveModeGpuDiscoveryPlugin])
+
+  private def logInfo(msg: => String): Unit = {
+    if (log.isInfoEnabled) {
+      log.info(msg)
+    }
+  }
+
+  private def logWarning(msg: => String): Unit = {
+    if (log.isWarnEnabled) {
+      log.warn(msg)
+    }
+  }
+
   override def discoverResource(
     request: ResourceRequest,
     sparkconf: SparkConf
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/JoinGatherer.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/JoinGatherer.scala
index 5688ee30b30..25c37296c9b 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/JoinGatherer.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/JoinGatherer.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2021-2025, NVIDIA CORPORATION. All rights reserved.
+ * Copyright (c) 2021-2026, NVIDIA CORPORATION. All rights reserved.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -155,7 +155,7 @@ object JoinGatherer {
       outOfBoundsPolicyRight: OutOfBoundsPolicy): JoinGatherer = {
     val left = JoinGatherer(leftMap, leftData, outOfBoundsPolicyLeft)
     val right = JoinGatherer(rightMap, rightData, outOfBoundsPolicyRight)
-    MultiJoinGather(left, right)
+    new MultiJoinGather(left, right)
   }
 
   def getRowsInNextBatch(gatherer: JoinGatherer, targetSize: Long,
@@ -227,7 +227,7 @@ object LazySpillableColumnarBatch {
 
   def spillOnly(wrapped: LazySpillableColumnarBatch): LazySpillableColumnarBatch = wrapped match {
     case alreadyGood: AllowSpillOnlyLazySpillableColumnarBatchImpl => alreadyGood
-    case anythingElse => AllowSpillOnlyLazySpillableColumnarBatchImpl(anythingElse)
+    case anythingElse => new AllowSpillOnlyLazySpillableColumnarBatchImpl(anythingElse)
   }
 }
 
@@ -236,7 +236,7 @@ object LazySpillableColumnarBatch {
  * batch it is only spilled. This is used for cases, like with a streaming hash join
  * where the data itself needs to out live the JoinGatherer it is handed off to.
  */
-case class AllowSpillOnlyLazySpillableColumnarBatchImpl(wrapped: LazySpillableColumnarBatch)
+class AllowSpillOnlyLazySpillableColumnarBatchImpl(val wrapped: LazySpillableColumnarBatch)
     extends LazySpillableColumnarBatch {
   override def getBatch: ColumnarBatch =
     wrapped.getBatch
@@ -749,7 +749,8 @@ class JoinGathererSameTable(
 /**
  * Join Gatherer for a left table and a right table
  */
-case class MultiJoinGather(left: JoinGatherer, right: JoinGatherer) extends JoinGatherer {
+class MultiJoinGather(val left: JoinGatherer, val right: JoinGatherer)
+    extends JoinGatherer with Serializable {
   assert(left.numRowsLeft == right.numRowsLeft,
     "all gatherers much have the same number of rows to gather")
 
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/MemoryChecker.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/MemoryChecker.scala
index 33124b28fdc..65e8e2bbcf2 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/MemoryChecker.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/MemoryChecker.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2025, NVIDIA CORPORATION.
+ * Copyright (c) 2025-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -25,7 +25,6 @@ import scala.util.{Failure, Success, Try}
 import com.nvidia.spark.rapids.Arm.withResource
 
 import org.apache.spark.SparkConf
-import org.apache.spark.internal.Logging
 
 trait MemoryChecker {
   def getAvailableMemoryBytes(rapidsConf: RapidsConf): Option[Long]
@@ -38,7 +37,19 @@ trait MemoryChecker {
  * on which it checks corresponding files, env variables, etc. for memory usage
  * and limits.
  */
-object MemoryCheckerImpl extends MemoryChecker with Logging {
+object MemoryCheckerImpl extends MemoryChecker {
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+
+  private def logInfo(msg: => String): Unit = {
+    if (log.isInfoEnabled) {
+      log.info(msg)
+    }
+  }
+
+  private def logWarning(msg: => String): Unit = {
+    if (log.isWarnEnabled) log.warn(msg) // build the by-name msg only when WARN is enabled
+  }
+
   def main(args: Array[String]): Unit = {
     val conf = new RapidsConf(new SparkConf())
     println(s"Available memory: ${getAvailableMemoryBytes(conf)} bytes")
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/MetaUtils.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/MetaUtils.scala
index f1561e2c251..675f355b92b 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/MetaUtils.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/MetaUtils.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2020-2024, NVIDIA CORPORATION.
+ * Copyright (c) 2020-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -16,7 +16,7 @@
 
 package com.nvidia.spark.rapids
 
-import java.nio.{ByteBuffer, ByteOrder}
+import java.nio.{Buffer, ByteBuffer, ByteOrder}
 
 import scala.collection.mutable.ArrayBuffer
 
@@ -25,7 +25,6 @@ import com.google.flatbuffers.FlatBufferBuilder
 import com.nvidia.spark.rapids.Arm.withResource
 import com.nvidia.spark.rapids.format._
 
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.types.DataType
 import org.apache.spark.sql.vectorized.ColumnarBatch
 import org.apache.spark.storage.ShuffleBlockBatchId
@@ -117,9 +116,9 @@ object MetaUtils {
       packedMeta: ByteBuffer,
       numRows: Long): TableMeta = {
     val vectorBuffer = fbb.createUnintializedVector(1, packedMeta.remaining(), 1)
-    packedMeta.mark()
+    packedMeta.asInstanceOf[Buffer].mark()
     vectorBuffer.put(packedMeta)
-    packedMeta.reset()
+    packedMeta.asInstanceOf[Buffer].reset()
     val packedMetaOffset = fbb.endVector()
 
     TableMeta.startTableMeta(fbb)
@@ -262,7 +261,7 @@ class DirectByteBufferFactory extends FlatBufferBuilder.ByteBufferFactory {
   }
 }
 
-object ShuffleMetadata extends Logging{
+object ShuffleMetadata {
 
   val bbFactory = new DirectByteBufferFactory
 
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/MultithreadedShuffleBufferCatalog.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/MultithreadedShuffleBufferCatalog.scala
index 35fd66d93ac..4fa7122f9e4 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/MultithreadedShuffleBufferCatalog.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/MultithreadedShuffleBufferCatalog.scala
@@ -18,7 +18,7 @@ package com.nvidia.spark.rapids
 
 import java.io.{InputStream, IOException}
 import java.lang.{Boolean => JBoolean}
-import java.nio.ByteBuffer
+import java.nio.{Buffer, ByteBuffer}
 import java.nio.channels.WritableByteChannel
 import java.util.HashSet
 import java.util.concurrent.ConcurrentHashMap
@@ -28,7 +28,6 @@ import scala.collection.mutable.ArrayBuffer
 import _root_.io.netty.handler.stream.ChunkedStream
 import com.nvidia.spark.rapids.spill.SpillablePartialFileHandle
 
-import org.apache.spark.internal.Logging
 import org.apache.spark.network.buffer.ManagedBuffer
 import org.apache.spark.network.util.AbstractFileRegion
 import org.apache.spark.storage.{ShuffleBlockBatchId, ShuffleBlockId}
@@ -40,10 +39,10 @@ import org.apache.spark.storage.{ShuffleBlockBatchId, ShuffleBlockId}
  * @param offset starting offset within the handle
  * @param length number of bytes in this segment
  */
-case class PartitionSegment(
-    handle: SpillablePartialFileHandle,
-    offset: Long,
-    length: Long)
+class PartitionSegment(
+    val handle: SpillablePartialFileHandle,
+    val offset: Long,
+    val length: Long)
 
 /**
  * Catalog for managing shuffle data in MULTITHREADED mode without merging.
@@ -57,7 +56,19 @@ case class PartitionSegment(
  * (MEMORY_WITH_SPILL mode) or stored directly on disk (ONLY_FILE mode) depending
  * on memory pressure - both modes work with this skip-merge design.
  */
-class MultithreadedShuffleBufferCatalog extends Logging {
+class MultithreadedShuffleBufferCatalog {
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+
+  private def logDebug(msg: => String): Unit = {
+    if (log.isDebugEnabled) {
+      log.debug(msg)
+    }
+  }
+
+  private def logError(msg: => String, throwable: Throwable): Unit = {
+    if (log.isErrorEnabled) log.error(msg, throwable) // build msg only when ERROR is enabled
+  }
+
 
   /**
    * Map from ShuffleBlockId to list of segments.
@@ -99,7 +110,7 @@ class MultithreadedShuffleBufferCatalog extends Logging {
     }
 
     val blockId = ShuffleBlockId(shuffleId, mapId, partitionId)
-    val segment = PartitionSegment(handle, offset, length)
+    val segment = new PartitionSegment(handle, offset, length)
 
     partitionSegments.compute(blockId, (_, existing) => {
       val segments = if (existing == null) new ArrayBuffer[PartitionSegment]() else existing
@@ -280,7 +291,7 @@ class MultiBatchManagedBuffer(segments: Seq[PartitionSegment]) extends ManagedBu
       }
     }
 
-    buffer.flip()
+    buffer.asInstanceOf[Buffer].flip()
     buffer
   }
 
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/NvcompLZ4CompressionCodec.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/NvcompLZ4CompressionCodec.scala
index 1b7a2e2f285..136375996c2 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/NvcompLZ4CompressionCodec.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/NvcompLZ4CompressionCodec.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2020-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2020-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -68,7 +68,7 @@ class BatchedNvcompLZ4Compressor(maxBatchMemorySize: Long,
             table,
             CodecType.NVCOMP_LZ4,
             compressedSize)
-          CompressedTable(compressedSize, meta, buffer)
+          new CompressedTable(compressedSize, meta, buffer)
         }.toArray
       }
     }
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/NvcompZSTDCompressionCodec.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/NvcompZSTDCompressionCodec.scala
index 647a318d076..88f0be60e0f 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/NvcompZSTDCompressionCodec.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/NvcompZSTDCompressionCodec.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2024-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2024-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -18,8 +18,7 @@ package com.nvidia.spark.rapids
 
 import ai.rapids.cudf.{BaseDeviceMemoryBuffer, ContiguousTable, Cuda, DeviceMemoryBuffer}
 import ai.rapids.cudf.nvcomp.{BatchedZstdCompressor, BatchedZstdDecompressor}
-import com.nvidia.spark.rapids.Arm.{closeOnExcept, withResource}
-import com.nvidia.spark.rapids.RapidsPluginImplicits.AutoCloseableProducingArray
+import com.nvidia.spark.rapids.Arm.closeOnExcept
 import com.nvidia.spark.rapids.format.{BufferMeta, CodecType}
 
 /** A table compression codec that uses nvcomp's ZSTD-GPU codec */
@@ -59,7 +58,7 @@ class BatchedNvcompZSTDCompressor(maxBatchMemorySize: Long,
         compressedBufs.zip(tables).map { case (buffer, table) =>
           val compressedLen = buffer.getLength
           val meta = MetaUtils.buildTableMeta(None, table, CodecType.NVCOMP_ZSTD, compressedLen)
-          CompressedTable(compressedLen, meta, buffer)
+          new CompressedTable(compressedLen, meta, buffer)
         }.toArray
       }
     }
@@ -90,23 +89,3 @@ class BatchedNvcompZSTDDecompressor(maxBatchMemory: Long,
     outputBufs
   }
 }
-
-object DeviceBuffersUtils {
-  def incRefCount(bufs: Array[BaseDeviceMemoryBuffer]): Array[BaseDeviceMemoryBuffer] = {
-    bufs.safeMap { b =>
-      b.incRefCount()
-      b
-    }
-  }
-
-  def allocateBuffers(bufSizes: Array[Long]): Array[DeviceMemoryBuffer] = {
-    var curPos = 0L
-    withResource(DeviceMemoryBuffer.allocate(bufSizes.sum)) { singleBuf =>
-      bufSizes.safeMap { len =>
-        val ret = singleBuf.slice(curPos, len)
-        curPos += len
-        ret
-      }
-    }
-  }
-}
\ No newline at end of file
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/NvtxRangeWithDoc.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/NvtxRangeWithDoc.scala
index b700e917cca..7759d990439 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/NvtxRangeWithDoc.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/NvtxRangeWithDoc.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2025, NVIDIA CORPORATION.
+ * Copyright (c) 2025-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -22,18 +22,17 @@ import scala.collection.mutable
 
 import ai.rapids.cudf.{NvtxColor, NvtxRange}
 
-import org.apache.spark.internal.Logging
-
-object RangeDebugger extends Logging {
+object RangeDebugger {
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
   val threadLocalStack = new ThreadLocal[mutable.ArrayStack[NvtxId]] {
     override def initialValue(): mutable.ArrayStack[NvtxId] = mutable.ArrayStack[NvtxId]()
   }
 
   private def dumpOrderErrorMessage(popped: Option[NvtxId], elem: NvtxId): Unit = {
-    logError(s"OUT OF ORDER POP of $elem")
-    logError(s"TOP OF STACK IS ${popped.getOrElse("<nil>")}")
+    log.error(s"OUT OF ORDER POP of $elem")
+    log.error(s"TOP OF STACK IS ${popped.getOrElse("<nil>")}")
     val stackTrace = Thread.currentThread.getStackTrace
-    stackTrace.foreach(elem => logError(elem.toString))
+    stackTrace.foreach(elem => log.error(elem.toString))
   }
 
   def push(elem: NvtxId): Unit = {
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/NvtxWithMetrics.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/NvtxWithMetrics.scala
index ada85d211e8..d05ecaa576b 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/NvtxWithMetrics.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/NvtxWithMetrics.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2019-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2019-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -76,11 +76,11 @@ object NvtxIdWithMetrics {
   }
 }
 
-class MetricRange(val metrics: Seq[GpuMetric], val excludeMetric: Seq[GpuMetric] = Seq.empty)
+class MetricRange(val metrics: Seq[GpuMetric], val excludeMetric: Seq[GpuMetric])
   extends AutoCloseable {
 
   // add a convenient constructor
-  def this(metrics: GpuMetric*) = this(metrics.toSeq)
+  def this(metrics: GpuMetric*) = this(metrics.toSeq, Seq.empty)
 
   val needTracks = metrics.map(_.tryActivateTimer(excludeMetric))
   private val start = System.nanoTime()
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/Plugin.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/Plugin.scala
index 7aad76138b9..15706589dd7 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/Plugin.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/Plugin.scala
@@ -33,6 +33,8 @@ import com.nvidia.spark.rapids.RapidsConf.AllowMultipleJars
 import com.nvidia.spark.rapids.RapidsPluginUtils.buildInfoEvent
 import com.nvidia.spark.rapids.ScalableTaskCompletion.onTaskCompletion
 import com.nvidia.spark.rapids.filecache.{FileCache, FileCacheLocalityManager, FileCacheLocalityMsg}
+import com.nvidia.spark.rapids.fileio.RapidsInputFiles
+import com.nvidia.spark.rapids.fileio.hadoop.PerfIOS3Reader
 import com.nvidia.spark.rapids.io.async.TrafficController
 import com.nvidia.spark.rapids.jni.{GpuTimeZoneDB, Hash, JSONUtils, RmmSpark, TaskPriority}
 import com.nvidia.spark.rapids.python.PythonWorkerSemaphore
@@ -40,7 +42,6 @@ import org.apache.commons.lang3.exception.ExceptionUtils
 
 import org.apache.spark.{ExceptionFailure, SparkConf, SparkContext, TaskContext, TaskFailedReason}
 import org.apache.spark.api.plugin.{DriverPlugin, ExecutorPlugin, PluginContext, SparkPlugin}
-import org.apache.spark.internal.Logging
 import org.apache.spark.rapids.hybrid.HybridExecutionUtils
 import org.apache.spark.serializer.{JavaSerializer, KryoSerializer}
 import org.apache.spark.sql.catalyst.rules.Rule
@@ -51,9 +52,10 @@ import org.apache.spark.sql.rapids.execution.TrampolineUtil
 
 class PluginException(msg: String) extends RuntimeException(msg)
 
-case class CudfVersionMismatchException(errorMsg: String) extends PluginException(errorMsg)
+class CudfVersionMismatchException(val errorMsg: String)
+    extends PluginException(errorMsg) with Serializable
 
-case class ColumnarOverrideRules() extends ColumnarRule with Logging {
+class ColumnarOverrideRules extends ColumnarRule {
   lazy val overrides: Rule[SparkPlan] = GpuOverrides()
   lazy val overrideTransitions: Rule[SparkPlan] = new GpuTransitionOverrides()
 
@@ -62,7 +64,33 @@ case class ColumnarOverrideRules() extends ColumnarRule with Logging {
   override def postColumnarTransitions: Rule[SparkPlan] = overrideTransitions
 }
 
-object RapidsPluginUtils extends Logging {
+object RapidsPluginUtils {
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+
+  private def logInfo(msg: => String): Unit = {
+    if (log.isInfoEnabled) {
+      log.info(msg)
+    }
+  }
+
+  private def logWarning(msg: => String): Unit = {
+    if (log.isWarnEnabled) {
+      log.warn(msg)
+    }
+  }
+
+  private def logDebug(msg: => String): Unit = {
+    if (log.isDebugEnabled) {
+      log.debug(msg)
+    }
+  }
+
+  private def logDebug(msg: => String, throwable: Throwable): Unit = {
+    if (log.isDebugEnabled) {
+      log.debug(msg, throwable)
+    }
+  }
+
   val CUDF_PROPS_FILENAME = "cudf-java-version-info.properties"
   val JNI_PROPS_FILENAME = "spark-rapids-jni-version-info.properties"
   val PLUGIN_PROPS_FILENAME = "rapids4spark-version-info.properties"
@@ -83,7 +111,7 @@ object RapidsPluginUtils extends Logging {
   private val SPARK_MASTER = "spark.master"
   private val SPARK_RAPIDS_REPO_URL = "https://github.com/NVIDIA/spark-rapids"
 
-  lazy val buildInfoEvent = SparkRapidsBuildInfoEvent(
+  lazy val buildInfoEvent = new SparkRapidsBuildInfoEvent(
     sparkRapidsBuildInfo = loadProps(PLUGIN_PROPS_FILENAME),
     sparkRapidsJniBuildInfo = loadProps(JNI_PROPS_FILENAME),
     cudfBuildInfo = loadProps(CUDF_PROPS_FILENAME),
@@ -441,12 +469,32 @@ object RapidsPluginUtils extends Logging {
 /**
  * The Spark driver plugin provided by the RAPIDS Spark plugin.
  */
-class RapidsDriverPlugin extends DriverPlugin with Logging {
+class RapidsDriverPlugin extends DriverPlugin {
   var rapidsShuffleHeartbeatManager: RapidsShuffleHeartbeatManager = null
   var shuffleCleanupListener: ShuffleCleanupListener = null
   private lazy val extraDriverPlugins =
     RapidsPluginUtils.extraPlugins.map(_.driverPlugin()).filterNot(_ == null)
 
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+
+  private def logInfo(msg: => String): Unit = {
+    if (log.isInfoEnabled) {
+      log.info(msg)
+    }
+  }
+
+  private def logWarning(msg: => String): Unit = {
+    if (log.isWarnEnabled) {
+      log.warn(msg)
+    }
+  }
+
+  private def logDebug(msg: => String): Unit = {
+    if (log.isDebugEnabled) {
+      log.debug(msg)
+    }
+  }
+
   override def receive(msg: Any): AnyRef = {
     msg match {
       case m: FileCacheLocalityMsg =>
@@ -487,6 +535,7 @@ class RapidsDriverPlugin extends DriverPlugin with Logging {
   override def init(
     sc: SparkContext, pluginContext: PluginContext): java.util.Map[String, String] = {
     val sparkConf = pluginContext.conf
+    RapidsInputFiles.setS3PerfReader(PerfIOS3Reader.INSTANCE)
     RapidsPluginUtils.fixupConfigsOnDriver(sparkConf)
     val conf = new RapidsConf(sparkConf)
     RapidsPluginUtils.detectMultipleJars(conf)
@@ -564,10 +613,10 @@ class RapidsDriverPlugin extends DriverPlugin with Logging {
  * We store the object in concurrent map where the key is the executor task thread.
  * It is `AutoCloseable`, so the caller must close it on task success or failure.
  */
-case class ActiveTaskMetrics(
-    stageId: Int,
-    taskAttemptId: Long,
-    attemptNumber: Int) extends AutoCloseable {
+class ActiveTaskMetrics(
+    val stageId: Int,
+    val taskAttemptId: Long,
+    val attemptNumber: Int) extends AutoCloseable with Serializable {
   private var nvtx = new NvtxRange(
     s"Stage $stageId Task $taskAttemptId-$attemptNumber", NvtxColor.DARK_GREEN)
   private var closed = false
@@ -586,12 +635,50 @@ case class ActiveTaskMetrics(
 /**
  * The Spark executor plugin provided by the RAPIDS Spark plugin.
  */
-class RapidsExecutorPlugin extends ExecutorPlugin with Logging {
+class RapidsExecutorPlugin extends ExecutorPlugin {
   var rapidsShuffleHeartbeatEndpoint: RapidsShuffleHeartbeatEndpoint = null
   var shuffleCleanupEndpoint: ShuffleCleanupEndpoint = null
   private lazy val extraExecutorPlugins =
     RapidsPluginUtils.extraPlugins.map(_.executorPlugin()).filterNot(_ == null)
 
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+
+  private def logInfo(msg: => String): Unit = {
+    if (log.isInfoEnabled) {
+      log.info(msg)
+    }
+  }
+
+  private def logWarning(msg: => String): Unit = {
+    if (log.isWarnEnabled) {
+      log.warn(msg)
+    }
+  }
+
+  private def logWarning(msg: => String, throwable: Throwable): Unit = {
+    if (log.isWarnEnabled) {
+      log.warn(msg, throwable)
+    }
+  }
+
+  private def logDebug(msg: => String): Unit = {
+    if (log.isDebugEnabled) {
+      log.debug(msg)
+    }
+  }
+
+  private def logError(msg: => String): Unit = {
+    if (log.isErrorEnabled) {
+      log.error(msg)
+    }
+  }
+
+  private def logError(msg: => String, throwable: Throwable): Unit = {
+    if (log.isErrorEnabled) {
+      log.error(msg, throwable)
+    }
+  }
+
   private val activeTaskInfo = new ConcurrentHashMap[Thread, ActiveTaskMetrics]()
 
   private var isAsyncProfilerEnabled = false
@@ -602,6 +689,7 @@ class RapidsExecutorPlugin extends ExecutorPlugin with Logging {
     try {
       // if configured, re-register checking leaks hook.
       reRegisterCheckLeakHook()
+      RapidsInputFiles.setS3PerfReader(PerfIOS3Reader.INSTANCE)
 
       val sparkConf = pluginContext.conf()
       val numCores = RapidsPluginUtils.estimateCoresOnExec(sparkConf)
@@ -738,16 +826,17 @@ class RapidsExecutorPlugin extends ExecutorPlugin with Logging {
   private def checkCudfVersion(conf: RapidsConf): Unit = {
     try {
       val expectedCudfVersion = buildInfoEvent.sparkRapidsBuildInfo.getOrElse("cudf_version",
-        throw CudfVersionMismatchException("Could not find cudf version in " +
+        throw new CudfVersionMismatchException("Could not find cudf version in " +
             RapidsPluginUtils.PLUGIN_PROPS_FILENAME))
 
       val cudfVersion = buildInfoEvent.cudfBuildInfo.getOrElse("version",
-        throw CudfVersionMismatchException("Could not find cudf version in " +
+        throw new CudfVersionMismatchException("Could not find cudf version in " +
             RapidsPluginUtils.CUDF_PROPS_FILENAME))
 
       // compare cudf version in the classpath with the cudf version expected by plugin
       if (!RapidsExecutorPlugin.cudfVersionSatisfied(expectedCudfVersion, cudfVersion)) {
-        throw CudfVersionMismatchException(s"Found cudf version $cudfVersion, RAPIDS Accelerator " +
+        throw new CudfVersionMismatchException(
+            s"Found cudf version $cudfVersion, RAPIDS Accelerator " +
             s"expects $expectedCudfVersion")
       }
     } catch {
@@ -877,7 +966,7 @@ class RapidsExecutorPlugin extends ExecutorPlugin with Logging {
     val attemptNumber = taskCtx.attemptNumber()
     activeTaskInfo.put(
       Thread.currentThread(),
-      ActiveTaskMetrics(stageId, taskAttemptId, attemptNumber))
+      new ActiveTaskMetrics(stageId, taskAttemptId, attemptNumber))
   }
 
   private def endTaskNvtx(): Unit = {
@@ -888,7 +977,27 @@ class RapidsExecutorPlugin extends ExecutorPlugin with Logging {
   }
 }
 
-object RapidsExecutorPlugin extends Logging {
+object RapidsExecutorPlugin {
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+
+  private def logInfo(msg: => String): Unit = {
+    if (log.isInfoEnabled) {
+      log.info(msg)
+    }
+  }
+
+  private def logWarning(msg: => String): Unit = {
+    if (log.isWarnEnabled) {
+      log.warn(msg)
+    }
+  }
+
+  private def logWarning(msg: => String, throwable: Throwable): Unit = {
+    if (log.isWarnEnabled) {
+      log.warn(msg, throwable)
+    }
+  }
+
   /**
    * Calling System.exit will trigger shutdown hooks to run.
    * This code is intended to let them run, but then force
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/PrioritySemaphore.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/PrioritySemaphore.scala
index 393d18569c6..f6c61f2e2e2 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/PrioritySemaphore.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/PrioritySemaphore.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2024-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2024-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -33,11 +33,11 @@ class PrioritySemaphore[T](val maxPermits: Long, val maxConcurrentGpuTasksLimit:
   private var occupiedSlots: Long = 0
   private var currentConcurrentGpuTasksNum: Long = 0
 
-  private case class ThreadInfo(priority: T,
-                                condition: Condition,
-                                computeNumPermits: () => Long,
-                                wasOnGpuBefore: () => Boolean,
-                                taskId: Long) {
+  private class ThreadInfo(val priority: T,
+                           val condition: Condition,
+                           val computeNumPermits: () => Long,
+                           val wasOnGpuBefore: () => Boolean,
+                           val taskId: Long) {
     var signaled: Boolean = false
     var permitsUsed: Long = 0
   }
@@ -60,7 +60,7 @@ class PrioritySemaphore[T](val maxPermits: Long, val maxConcurrentGpuTasksLimit:
       if (waitingQueue.size() > 0 &&
         priorityComp.compare(
           waitingQueue.peek(),
-          ThreadInfo(priority, null, () => numPermits, wasOnGpuBefore, taskAttemptId)
+          new ThreadInfo(priority, null, () => numPermits, wasOnGpuBefore, taskAttemptId)
         ) < 0) {
         false
       } else if (!canAcquire(numPermits)) {
@@ -81,7 +81,8 @@ class PrioritySemaphore[T](val maxPermits: Long, val maxConcurrentGpuTasksLimit:
       val numPermitsNow = computePermits()
       if (!tryAcquire(numPermitsNow, priority, wasOnGpuBefore, taskAttemptId)) {
         val condition = lock.newCondition()
-        val info = ThreadInfo(priority, condition, computePermits, wasOnGpuBefore, taskAttemptId)
+        val info = new ThreadInfo(
+          priority, condition, computePermits, wasOnGpuBefore, taskAttemptId)
         try {
           waitingQueue.add(info)
           // only count tasks that had held semaphore before,
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/RapidsConf.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/RapidsConf.scala
index 7021d62b18c..3bd3a920f09 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/RapidsConf.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/RapidsConf.scala
@@ -27,7 +27,6 @@ import com.nvidia.spark.rapids.jni.kudo.DumpOption
 import com.nvidia.spark.rapids.lore.{LoreId, OutputLoreId}
 
 import org.apache.spark.SparkConf
-import org.apache.spark.internal.Logging
 import org.apache.spark.network.util.{ByteUnit, JavaUtils}
 import org.apache.spark.sql.catalyst.analysis.FunctionRegistry
 import org.apache.spark.sql.internal.SQLConf
@@ -319,7 +318,19 @@ object RapidsReaderType extends Enumeration {
   val AUTO, COALESCING, MULTITHREADED, PERFILE = Value
 }
 
-object RapidsConf extends Logging {
+object RapidsConf {
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+
+  private def logDebug(msg: => String): Unit = {
+    if (log.isDebugEnabled) {
+      log.debug(msg)
+    }
+  }
+
+  private def logWarning(msg: => String): Unit = {
+    if (log.isWarnEnabled) log.warn(msg) // build the by-name msg only when WARN is enabled
+  }
+
   val MULTITHREAD_READ_NUM_THREADS_DEFAULT = 20
 
   private val registeredConfs = new ListBuffer[ConfEntry[_]]()
@@ -3015,7 +3026,7 @@ val SHUFFLE_COMPRESSION_LZ4_CHUNK_SIZE = conf("spark.rapids.shuffle.compression.
       .createWithDefault(-1)
 
   // default value for the OOM injection logic (no injection, for regular operation)
-  private val noInjection = OomInjectionConf(
+  private val noInjection = new OomInjectionConf(
     numOoms = 0,
     skipCount = 0,
     oomInjectionFilter = OomInjectionType.CPU_OR_GPU,
@@ -3064,7 +3075,7 @@ val SHUFFLE_COMPRESSION_LZ4_CHUNK_SIZE = conf("spark.rapids.shuffle.compression.
       TEST_RETRY_OOM_INJECTION_MODE.get(SQLConf.get).toLowerCase match {
         case "false" => noInjection
         case "true" =>
-          OomInjectionConf(numOoms = 1, skipCount = 0,
+          new OomInjectionConf(numOoms = 1, skipCount = 0,
             oomInjectionFilter = OomInjectionType.CPU_OR_GPU, withSplit = false)
         case injectConfStr =>
           val injectConfMap = injectConfStr.split(',').map(_.split('=')).collect {
@@ -3077,7 +3088,7 @@ val SHUFFLE_COMPRESSION_LZ4_CHUNK_SIZE = conf("spark.rapids.shuffle.compression.
             .toUpperCase()
           val oomFilter = OomInjectionType.valueOf(oomFilterStr)
           val withSplit = injectConfMap.getOrElse("split", false.toString)
-          val ret = OomInjectionConf(
+          val ret = new OomInjectionConf(
             numOoms = numOoms.toInt,
             skipCount = skipCount.toInt,
             oomInjectionFilter = oomFilter,
@@ -3269,15 +3280,19 @@ val SHUFFLE_COMPRESSION_LZ4_CHUNK_SIZE = conf("spark.rapids.shuffle.compression.
     val buildSideSelection = JoinBuildSideSelection.withName(buildSideStr)
     val logCardinality = LOG_JOIN_CARDINALITY.get(conf)
     val sizeEstimateThreshold = JOIN_GATHERER_SIZE_ESTIMATE_THRESHOLD.get(conf)
-    JoinOptions(strategy, buildSideSelection, targetSize, logCardinality, sizeEstimateThreshold)
+    new JoinOptions(strategy, buildSideSelection, targetSize, logCardinality, sizeEstimateThreshold)
   }
 }
 
-class RapidsConf(conf: Map[String, String]) extends Logging {
+class RapidsConf(conf: Map[String, String]) {
 
   import ConfHelper._
   import RapidsConf._
 
+  private def logWarning(msg: => String): Unit = {
+    RapidsConf.logWarning(msg)
+  }
+
   def this(sqlConf: SQLConf) = {
     this(sqlConf.getAllConfs)
   }
@@ -3370,7 +3385,7 @@ class RapidsConf(conf: Map[String, String]) extends Logging {
     val buildSideSelection = JoinBuildSideSelection.withName(buildSideStr)
     val logCardinality = get(LOG_JOIN_CARDINALITY)
     val sizeEstimateThreshold = get(JOIN_GATHERER_SIZE_ESTIMATE_THRESHOLD)
-    JoinOptions(strategy, buildSideSelection, targetSize, logCardinality, sizeEstimateThreshold)
+    new JoinOptions(strategy, buildSideSelection, targetSize, logCardinality, sizeEstimateThreshold)
   }
 
   lazy val sizedJoinPartitionAmplification: Double = get(SIZED_JOIN_PARTITION_AMPLIFICATION)
@@ -4130,9 +4145,12 @@ class RapidsConf(conf: Map[String, String]) extends Logging {
   }
 }
 
-case class OomInjectionConf(
-  numOoms: Int,
-  skipCount: Int,
-  withSplit: Boolean,
-  oomInjectionFilter: OomInjectionType
-)
+class OomInjectionConf(
+    val numOoms: Int,
+    val skipCount: Int,
+    val withSplit: Boolean,
+    val oomInjectionFilter: OomInjectionType) extends Serializable {
+  override def toString: String =
+    "OomInjectionConf(" + numOoms + "," + skipCount + "," + withSplit + "," +
+        oomInjectionFilter + ")"
+}
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/RapidsMeta.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/RapidsMeta.scala
index bc27d2af657..a654ab16658 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/RapidsMeta.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/RapidsMeta.scala
@@ -22,7 +22,7 @@ import scala.collection.mutable
 
 import com.nvidia.spark.rapids.GpuTypedImperativeSupportedAggregateExecMeta.{preRowToColProjection, readBufferConverter}
 import com.nvidia.spark.rapids.RapidsMeta.noNeedToReplaceReason
-import com.nvidia.spark.rapids.shims.{AggregateInPandasExecShims, DistributionUtil, SparkShimImpl}
+import com.nvidia.spark.rapids.shims.{DistributionUtil, SparkShimImpl}
 
 import org.apache.spark.sql.catalyst.expressions.{Attribute, AttributeReference, BinaryExpression, BoundReference, Cast, ComplexTypeMergingExpression, Expression, Literal, QuaternaryExpression, RuntimeReplaceable, String2TrimExpression, TernaryExpression, TimeZoneAwareExpression, UnaryExpression, UTCTimestamp, WindowExpression, WindowFunction}
 import org.apache.spark.sql.catalyst.expressions.aggregate.{AggregateExpression, AggregateFunction, ImperativeAggregate, TypedImperativeAggregate}
@@ -1029,15 +1029,49 @@ object ExpressionContext {
       case _ => None
     }
 
+  // Reflective handles to the shim singletons: Scala objects, hence the "$" class-name suffix
+  // and the static MODULE$ field. Every handle is lazy, so it is looked up once on first use.
+  @transient private[this] lazy val sparkShimImplModule: AnyRef =
+    Class.forName("com.nvidia.spark.rapids.shims.SparkShimImpl" + "$")
+      .getField("MODULE" + "$").get(null)
+
+  @transient private[this] lazy val aggregateInPandasExecShimsModule: AnyRef =
+    Class.forName("com.nvidia.spark.rapids.shims.AggregateInPandasExecShims" + "$")
+      .getField("MODULE" + "$").get(null)
+
+  // Finds the public method `name` that takes a single SparkPlan on the singleton's class.
+  private def planMethod(module: AnyRef, name: String): java.lang.reflect.Method =
+    module.getClass.getMethod(name, classOf[SparkPlan])
+
+  @transient private[this] lazy val isWindowFunctionExecMethod =
+    planMethod(sparkShimImplModule, "isWindowFunctionExec")
+
+  @transient private[this] lazy val isAggregateInPandasExecMethod =
+    planMethod(aggregateInPandasExecShimsModule, "isAggregateInPandasExec")
+
+  @transient private[this] lazy val aggregateInPandasGroupingExpressionsMethod =
+    planMethod(aggregateInPandasExecShimsModule, "getGroupingExpressions")
+
+  private def isWindowFunctionExec(plan: SparkPlan): Boolean =
+    isWindowFunctionExecMethod.invoke(sparkShimImplModule, plan).asInstanceOf[Boolean]
+
+  private def isAggregateInPandasExec(plan: SparkPlan): Boolean =
+    isAggregateInPandasExecMethod.invoke(aggregateInPandasExecShimsModule, plan)
+      .asInstanceOf[Boolean]
+
+  private def aggregateInPandasGroupingExpressions(plan: SparkPlan): Seq[_] =
+    aggregateInPandasGroupingExpressionsMethod.invoke(aggregateInPandasExecShimsModule, plan)
+      .asInstanceOf[Seq[_]]
+
   def getAggregateFunctionContext(meta: BaseExprMeta[_]): ExpressionContext = {
     val parent = findParentPlanMeta(meta)
     assert(parent.isDefined, "It is expected that an aggregate function is a child of a SparkPlan")
     parent.get.wrapped match {
-      case agg: SparkPlan if SparkShimImpl.isWindowFunctionExec(agg) =>
+      case agg: SparkPlan if isWindowFunctionExec(agg) =>
         WindowAggExprContext
       // AggregateInPandasExec renamed to ArrowAggregatePythonExec in Spark 4.1.0
-      case agg: SparkPlan if AggregateInPandasExecShims.isAggregateInPandasExec(agg) =>
-        if (AggregateInPandasExecShims.getGroupingExpressions(agg).isEmpty) {
+      case agg: SparkPlan if isAggregateInPandasExec(agg) =>
+        if (aggregateInPandasGroupingExpressions(agg).isEmpty) {
           ReductionAggExprContext
         } else {
           GroupByAggExprContext
@@ -1435,7 +1469,7 @@ abstract class BaseExprMeta[INPUT <: Expression](
     val inputMapping = scala.collection.mutable.Map[Int, Int]()
     
     gpuInputsWithIndex.foreach { case (gpuExpr, originalIndex) =>
-      val exprWrapper = GpuExpressionEquals(gpuExpr)
+      val exprWrapper = new GpuExpressionEquals(gpuExpr)
       seenExpressions.get(exprWrapper) match {
         case Some(existingIndex) =>
           // This expression is a duplicate - map to existing index
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/RapidsShuffleHeartbeatManager.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/RapidsShuffleHeartbeatManager.scala
index 598d9bd5447..d9098766085 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/RapidsShuffleHeartbeatManager.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/RapidsShuffleHeartbeatManager.scala
@@ -26,12 +26,19 @@ import org.apache.commons.lang3.mutable.MutableLong
 
 import org.apache.spark.SparkEnv
 import org.apache.spark.api.plugin.PluginContext
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.rapids.{ProxyRapidsShuffleInternalManagerBase, RapidsShuffleInternalManagerBase}
 import org.apache.spark.storage.BlockManagerId
 
 class RapidsShuffleHeartbeatManager(heartbeatIntervalMillis: Long,
-                                    heartbeatTimeoutMillis: Long) extends Logging {
+                                    heartbeatTimeoutMillis: Long) {
+  private val log = org.slf4j.LoggerFactory.getLogger(classOf[RapidsShuffleHeartbeatManager])
+
+  /**
+   * Logs at DEBUG. `msg` is by-name, so it is only evaluated when DEBUG is enabled.
+   */
+  private def logDebug(msg: => String): Unit =
+    if (log.isDebugEnabled) log.debug(msg)
+
   require(heartbeatIntervalMillis > 0,
     s"The interval value: $heartbeatIntervalMillis ms is not > 0")
 
@@ -45,14 +52,18 @@ class RapidsShuffleHeartbeatManager(heartbeatIntervalMillis: Long,
   // exposed so that it can be mocked in the tests
   def getCurrentTimeMillis: Long = System.currentTimeMillis()
 
-  private case class ExecutorRegistration(
-      id: BlockManagerId,
+  private class ExecutorRegistration(
+      val id: BlockManagerId,
       // this is this executor's registration order, as given by this manager
-      registrationOrder: Long,
+      val registrationOrder: Long,
       // this is the last registration order this executor is aware of overall
-      lastRegistrationOrderSeen: MutableLong,
+      val lastRegistrationOrderSeen: MutableLong,
       // last heartbeat received from this executor in millis
-      lastHeartbeatMillis: MutableLong)
+      val lastHeartbeatMillis: MutableLong) {
+    override def toString: String =
+      s"ExecutorRegistration($id,$registrationOrder,$lastRegistrationOrderSeen," +
+        s"$lastHeartbeatMillis)"
+  }
 
   // a counter used to mark each new executor registration with an order
   var registrationOrder = 0L
@@ -82,7 +93,7 @@ class RapidsShuffleHeartbeatManager(heartbeatIntervalMillis: Long,
     require(!executorRegistrations.containsKey(id), s"Executor $id already registered")
     removeDeadExecutors(getCurrentTimeMillis)
     val allExecutors = executors.map(e => e.id).toArray
-    val newReg = ExecutorRegistration(id,
+    val newReg = new ExecutorRegistration(id,
       registrationOrder,
       new MutableLong(registrationOrder),
       new MutableLong(getCurrentTimeMillis))
@@ -167,7 +178,40 @@ class RapidsShuffleHeartbeatManager(heartbeatIntervalMillis: Long,
 }
 
 class RapidsShuffleHeartbeatEndpoint(pluginContext: PluginContext, conf: RapidsConf)
-  extends Logging with AutoCloseable {
+  extends AutoCloseable {
+
+  private val log = org.slf4j.LoggerFactory.getLogger(classOf[RapidsShuffleHeartbeatEndpoint])
+
+  /**
+   * Logs at INFO. `msg` is by-name, so it is only evaluated when INFO is enabled.
+   */
+  private def logInfo(msg: => String): Unit =
+    if (log.isInfoEnabled) log.info(msg)
+
+  /**
+   * Logs at WARN. `msg` is by-name, so it is only evaluated when WARN is enabled.
+   */
+  private def logWarning(msg: => String): Unit =
+    if (log.isWarnEnabled) log.warn(msg)
+
+  /**
+   * Logs at DEBUG. `msg` is by-name, so it is only evaluated when DEBUG is enabled.
+   */
+  private def logDebug(msg: => String): Unit =
+    if (log.isDebugEnabled) log.debug(msg)
+
+  /**
+   * Logs at TRACE. `msg` is by-name, so it is only evaluated when TRACE is enabled.
+   */
+  private def logTrace(msg: => String): Unit =
+    if (log.isTraceEnabled) log.trace(msg)
+
+  /**
+   * Logs `msg` with `throwable` at ERROR; `msg` is only evaluated when ERROR is enabled.
+   */
+  private def logError(msg: => String, throwable: Throwable): Unit =
+    if (log.isErrorEnabled) log.error(msg, throwable)
+
   // Number of milliseconds between heartbeats to driver
   private[this] val heartbeatIntervalMillis =
     conf.shuffleTransportEarlyStartHeartbeatInterval
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/RmmRapidsRetryIterator.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/RmmRapidsRetryIterator.scala
index 25ec92937e1..98119619e19 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/RmmRapidsRetryIterator.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/RmmRapidsRetryIterator.scala
@@ -31,9 +31,9 @@ import com.nvidia.spark.rapids.jni.{CpuRetryOOM, CpuSplitAndRetryOOM, GpuRetryOO
 import com.nvidia.spark.rapids.spill.SpillFramework
 
 import org.apache.spark.TaskContext
-import org.apache.spark.internal.Logging
 
-object RmmRapidsRetryIterator extends Logging {
+object RmmRapidsRetryIterator {
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
 
   /**
    * withRetry for Iterator[T]. This helper calls a function `fn` as it takes
@@ -100,7 +100,7 @@ object RmmRapidsRetryIterator extends Logging {
       splitPolicy: T => Seq[T])
       (fn: T => K): Iterator[K] = {
     val attemptIter = new AutoCloseableAttemptSpliterator(
-      SingleItemAutoCloseableIteratorInternal(input), fn, splitPolicy)
+      new SingleItemAutoCloseableIteratorInternal(input), fn, splitPolicy)
     new RmmRapidsRetryAutoCloseableIterator(attemptIter)
   }
 
@@ -130,7 +130,7 @@ object RmmRapidsRetryIterator extends Logging {
       input: T)
       (fn: T => K): K = {
     val attemptIter = new AutoCloseableAttemptSpliterator(
-      SingleItemAutoCloseableIteratorInternal(input), fn)
+      new SingleItemAutoCloseableIteratorInternal(input), fn)
     drainSingleWithVerification(
       new RmmRapidsRetryAutoCloseableIterator(attemptIter))
   }
@@ -160,9 +160,9 @@ object RmmRapidsRetryIterator extends Logging {
   def withRetryNoSplit[T <: AutoCloseable, K](
       input: Seq[T])
       (fn: Seq[T] => K): K = {
-    val wrapped = AutoCloseableSeqInternal(input)
+    val wrapped = new AutoCloseableSeqInternal(input)
     val attemptIter = new AutoCloseableAttemptSpliterator(
-      SingleItemAutoCloseableIteratorInternal(wrapped), fn)
+      new SingleItemAutoCloseableIteratorInternal(wrapped), fn)
     drainSingleWithVerification(
       new RmmRapidsRetryAutoCloseableIterator(attemptIter))
   }
@@ -346,7 +346,7 @@ object RmmRapidsRetryIterator extends Logging {
    * @param ts the Seq to wrap
    * @tparam T the type of the items in `ts`
    */
-  private case class AutoCloseableSeqInternal[T <: AutoCloseable](ts: Seq[T])
+  private class AutoCloseableSeqInternal[T <: AutoCloseable](ts: Seq[T])
       extends Seq[T] with AutoCloseable {
     override def close(): Unit = {
       ts.foreach(_.safeClose())
@@ -375,7 +375,7 @@ object RmmRapidsRetryIterator extends Logging {
    * @param ts the AutoCloseable item to close if this iterator hasn't been drained
    * @tparam T the type of `ts`, must be AutoCloseable
    */
-  private case class SingleItemAutoCloseableIteratorInternal[T <: AutoCloseable](ts: T)
+  private class SingleItemAutoCloseableIteratorInternal[T <: AutoCloseable](ts: T)
       extends Iterator[T] with AutoCloseable {
 
     private var wasCalledSuccessfully = false
@@ -754,7 +754,7 @@ object RmmRapidsRetryIterator extends Logging {
               } else {
                 splitReason = SplitReason.CPU_OOM
               }
-              logInfo("splitReason is set " +
+              log.info("splitReason is set " +
                 s"to ${splitReason} after checking isRetryOrSplitAndRetry, related exception:",
                 ex)
             }
@@ -773,7 +773,7 @@ object RmmRapidsRetryIterator extends Logging {
                   }
                 }
                 if (splitReason == SplitReason.GPU_OOM || splitReason == SplitReason.CPU_OOM) {
-                  logInfo(s"splitReason is set to ${splitReason} after checking " +
+                  log.info(s"splitReason is set to ${splitReason} after checking " +
                     s"causedByRetryOrSplit, related exception:", ex)
                 }
               }
@@ -791,7 +791,7 @@ object RmmRapidsRetryIterator extends Logging {
               if (isOrCausedByColumnSizeOverflow(ex)) {
                 // CUDF column size overflow? Attempt split-retry.
                 splitReason = SplitReason.CUDF_OVERFLOW
-                logInfo(s"splitReason is set to ${splitReason} after checking " +
+                log.info(s"splitReason is set to ${splitReason} after checking " +
                   s"isOrCausedByColumnSizeOverflow, related exception:", ex)
               } else {
                 // we want to throw early here, since we got an exception
@@ -879,7 +879,7 @@ object RmmRapidsRetryIterator extends Logging {
                 s" minimum: ${target.minSize}")
         }
       }
-      Seq(AutoCloseableTargetSize(newTarget, target.minSize, target.dataSize))
+      Seq(new AutoCloseableTargetSize(newTarget, target.minSize, target.dataSize))
     }
   }
 
@@ -937,8 +937,8 @@ object RmmRapidsRetryIterator extends Logging {
 
   private def logSpillFrameworkSummary(): Unit = {
-    // print spillable status
-    logInfo(SpillFramework.getHostStoreSpillableSummary)
-    logInfo(SpillFramework.getDeviceStoreSpillableSummary)
+    // print spillable status; the summaries are only built when INFO logging is enabled
+    if (log.isInfoEnabled) log.info(SpillFramework.getHostStoreSpillableSummary)
+    if (log.isInfoEnabled) log.info(SpillFramework.getDeviceStoreSpillableSummary)
   }
 
   // For GPU/CPU SplitAndRetryOOM, we are very interested what each task is doing when one
@@ -956,12 +956,12 @@ object RmmRapidsRetryIterator extends Logging {
       }
       sb.append("\n\n")
     })
-    logInfo(sb.toString())
+    log.info(sb.toString())
   }
 
   private def logMemoryBookkeeping(): Unit = { // use synchronized to keep neat
     // print host memory bookkeeping
-    logInfo(HostAlloc.getHostAllocBookkeepSummary())
+    log.info(HostAlloc.getHostAllocBookkeepSummary())
 
     // print device memory bookkeeping
     // TODO: uncomment this once we have device memory bookkeeping in spark-rapids-jni
@@ -976,12 +976,6 @@ object RmmRapidsRetryIterator extends Logging {
  * `CpuSplitAndRetryOOM`, a split policy like `splitTargetSizeInHalfGpu` or
  * `splitTargetSizeInHalfCpu` can be used to retry the block with a smaller target size.
  */
-case class AutoCloseableTargetSize(targetSize: Long, minSize: Long,
-    dataSize: Long = 0) extends AutoCloseable {
-  def this(targetSize: Long, minSize: Long) = this(targetSize, minSize, 0)
-  override def close(): Unit = ()
-}
-
 /**
  * This leverages a ThreadLocal of boolean to track if a task thread is currently
  * executing a retry. And the boolean state will be used by all the
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/ShuffleBufferCatalog.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/ShuffleBufferCatalog.scala
index 2dee040dad7..d7dab6f58c5 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/ShuffleBufferCatalog.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/ShuffleBufferCatalog.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2020-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2020-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -28,22 +28,21 @@ import com.nvidia.spark.rapids.format.TableMeta
 import com.nvidia.spark.rapids.spill.{SpillableDeviceBufferHandle, SpillableHandle}
 
 import org.apache.spark.{SparkEnv, TaskContext}
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.rapids.execution.TrampolineUtil
 import org.apache.spark.sql.types.DataType
 import org.apache.spark.sql.vectorized.ColumnarBatch
 import org.apache.spark.storage.ShuffleBlockId
 
-/** Identifier for a shuffle buffer that holds the data for a table */
-case class ShuffleBufferId(
-    blockId: ShuffleBlockId,
-    tableId: Int) {
-  val shuffleId: Int = blockId.shuffleId
-  val mapId: Long = blockId.mapId
-}
-
 /** Catalog for lookup of shuffle buffers by block ID */
-class ShuffleBufferCatalog extends Logging {
+class ShuffleBufferCatalog {
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+
+  /**
+   * Logs at WARN. `msg` is by-name, so it is only evaluated when WARN is enabled.
+   */
+  private def logWarning(msg: => String): Unit =
+    if (log.isWarnEnabled) log.warn(msg)
+
   /**
    * Information stored for each active shuffle.
    * A shuffle block can be comprised of multiple batches. Each batch
@@ -259,7 +258,7 @@ class ShuffleBufferCatalog extends Logging {
     }
 
     val tableId = tableIdCounter.getAndUpdate(ShuffleBufferCatalog.TABLE_ID_UPDATER)
-    val id = ShuffleBufferId(blockId, tableId)
+    val id = new ShuffleBufferId(blockId, tableId)
     val prev = tableMap.put(tableId, id)
     if (prev != null) {
       throw new IllegalStateException(s"table ID $tableId is already in use")
@@ -283,7 +282,7 @@ class ShuffleBufferCatalog extends Logging {
     val (maybeHandle, meta) = bufferIdToHandle.get(shuffleBufferId)
     maybeHandle match {
       case Some(spillable) =>
-        RapidsShuffleHandle(spillable, meta)
+        new RapidsShuffleHandle(spillable, meta)
       case None =>
         throw new IllegalStateException(
           "a buffer handle could not be obtained for a degenerate buffer")
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/ShuffleCleanupEndpoint.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/ShuffleCleanupEndpoint.scala
index a7b6e065354..cb65d3764fa 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/ShuffleCleanupEndpoint.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/ShuffleCleanupEndpoint.scala
@@ -23,7 +23,6 @@ import scala.collection.mutable.ArrayBuffer
 import com.nvidia.spark.rapids.jni.RmmSpark
 
 import org.apache.spark.api.plugin.PluginContext
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.rapids.GpuShuffleEnv
 
 /**
@@ -38,7 +37,40 @@ import org.apache.spark.sql.rapids.GpuShuffleEnv
  */
 class ShuffleCleanupEndpoint(
     pluginContext: PluginContext,
-    pollIntervalMs: Long = 1000) extends Logging with AutoCloseable {
+    pollIntervalMs: Long = 1000) extends AutoCloseable {
+
+  private val log = org.slf4j.LoggerFactory.getLogger(classOf[ShuffleCleanupEndpoint])
+
+  /**
+   * Logs at INFO. `msg` is by-name, so it is only evaluated when INFO is enabled.
+   */
+  private def logInfo(msg: => String): Unit =
+    if (log.isInfoEnabled) log.info(msg)
+
+  /**
+   * Logs at WARN. `msg` is by-name, so it is only evaluated when WARN is enabled.
+   */
+  private def logWarning(msg: => String): Unit =
+    if (log.isWarnEnabled) log.warn(msg)
+
+  /**
+   * Logs `msg` with `throwable` at WARN; `msg` is only evaluated when WARN is enabled.
+   */
+  private def logWarning(msg: => String, throwable: Throwable): Unit =
+    if (log.isWarnEnabled) log.warn(msg, throwable)
+
+  /**
+   * Logs at DEBUG. `msg` is by-name, so it is only evaluated when DEBUG is enabled.
+   */
+  private def logDebug(msg: => String): Unit =
+    if (log.isDebugEnabled) log.debug(msg)
+
+  /**
+   * Logs at TRACE. `msg` is by-name, so it is only evaluated when TRACE is enabled.
+   */
+  private def logTrace(msg: => String): Unit =
+    if (log.isTraceEnabled) log.trace(msg)
+
 
   private val executorId: String = pluginContext.executorID()
 
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/ShuffleCleanupManager.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/ShuffleCleanupManager.scala
index ef90caee02d..839851a4cf5 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/ShuffleCleanupManager.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/ShuffleCleanupManager.scala
@@ -22,7 +22,6 @@ import java.util.concurrent.{ConcurrentHashMap, Executors, ScheduledExecutorServ
 import scala.collection.mutable.ArrayBuffer
 
 import org.apache.spark.SparkContext
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.rapids.execution.TrampolineUtil
 
 /**
@@ -89,7 +88,33 @@ class ShuffleCleanupManager(
     sc: SparkContext,
     staleEntryMaxAgeMs: Long = 300000,  // 5 minutes
     cleanupIntervalMs: Long = 60000     // 1 minute
-) extends Logging {
+) {
+
+  private val log = org.slf4j.LoggerFactory.getLogger(classOf[ShuffleCleanupManager])
+
+  /**
+   * Logs at INFO. `msg` is by-name, so it is only evaluated when INFO is enabled.
+   */
+  private def logInfo(msg: => String): Unit =
+    if (log.isInfoEnabled) log.info(msg)
+
+  /**
+   * Logs at WARN. `msg` is by-name, so it is only evaluated when WARN is enabled.
+   */
+  private def logWarning(msg: => String): Unit =
+    if (log.isWarnEnabled) log.warn(msg)
+
+  /**
+   * Logs `msg` with `throwable` at WARN; `msg` is only evaluated when WARN is enabled.
+   */
+  private def logWarning(msg: => String, throwable: Throwable): Unit =
+    if (log.isWarnEnabled) log.warn(msg, throwable)
+
+  /**
+   * Logs at DEBUG. `msg` is by-name, so it is only evaluated when DEBUG is enabled.
+   */
+  private def logDebug(msg: => String): Unit =
+    if (log.isDebugEnabled) log.debug(msg)
 
   /**
    * Shuffles pending cleanup. Maps shuffleId -> timestamp when unregister was called.
@@ -192,8 +217,13 @@ class ShuffleCleanupManager(
 
         try {
           TrampolineUtil.postEvent(sc,
-            SparkRapidsShuffleDiskSavingsEvent(shuffleId, stat.bytesFromMemory, stat.bytesFromDisk,
-              stat.numExpansions, stat.numSpills, stat.numForcedFileOnly))
+            new SparkRapidsShuffleDiskSavingsEvent(
+              shuffleId,
+              stat.bytesFromMemory,
+              stat.bytesFromDisk,
+              stat.numExpansions,
+              stat.numSpills,
+              stat.numForcedFileOnly))
         } catch {
           case e: Exception =>
             logWarning(s"Failed to post shuffle disk savings event for shuffle $shuffleId", e)
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/ShuffleReceivedBufferCatalog.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/ShuffleReceivedBufferCatalog.scala
index 450622ef3ba..513e779098f 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/ShuffleReceivedBufferCatalog.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/ShuffleReceivedBufferCatalog.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2020-2024, NVIDIA CORPORATION.
+ * Copyright (c) 2020-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -22,19 +22,19 @@ import com.nvidia.spark.rapids.RapidsPluginImplicits.AutoCloseableColumn
 import com.nvidia.spark.rapids.format.TableMeta
 import com.nvidia.spark.rapids.spill.SpillableDeviceBufferHandle
 
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.types.DataType
 import org.apache.spark.sql.vectorized.ColumnarBatch
 
-case class RapidsShuffleHandle(
-    spillable: SpillableDeviceBufferHandle, tableMeta: TableMeta) extends AutoCloseable {
+class RapidsShuffleHandle(
+    val spillable: SpillableDeviceBufferHandle,
+    val tableMeta: TableMeta) extends AutoCloseable with Serializable {
   override def close(): Unit = {
     spillable.safeClose()
   }
 }
 
 /** Catalog for lookup of shuffle buffers by block ID */
-class ShuffleReceivedBufferCatalog() extends Logging {
+class ShuffleReceivedBufferCatalog() {
 
   /**
    * Adds a buffer to the device storage, taking ownership of the buffer.
@@ -52,7 +52,7 @@ class ShuffleReceivedBufferCatalog() extends Logging {
       buffer: DeviceMemoryBuffer,
       tableMeta: TableMeta,
       initialSpillPriority: Long): RapidsShuffleHandle = {
-    RapidsShuffleHandle(SpillableDeviceBufferHandle(buffer), tableMeta)
+    new RapidsShuffleHandle(SpillableDeviceBufferHandle(buffer), tableMeta)
   }
 
   /**
@@ -62,7 +62,7 @@ class ShuffleReceivedBufferCatalog() extends Logging {
    * @return RapidsShuffleHandle associated with this buffer
    */
   def addDegenerateBatch(meta: TableMeta): RapidsShuffleHandle  = {
-    RapidsShuffleHandle(null, meta)
+    new RapidsShuffleHandle(null, meta)
   }
 
   def getColumnarBatchAndRemove(handle: RapidsShuffleHandle,
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/SortUtils.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/SortUtils.scala
index 8203cefdadd..ac25584833d 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/SortUtils.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/SortUtils.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2019-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2019-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -413,7 +413,7 @@ class GpuSorter(
   }
 }
 
-case class GpuSortOrderMeta(
+class GpuSortOrderMeta(
    sortOrder: SortOrder,
    override val conf: RapidsConf,
    parentOpt: Option[RapidsMeta[_, _, _]],
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/SpillPriorities.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/SpillPriorities.scala
deleted file mode 100644
index 9c82f71c469..00000000000
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/SpillPriorities.scala
+++ /dev/null
@@ -1,70 +0,0 @@
-/*
- * Copyright (c) 2020-2025, NVIDIA CORPORATION.
- *
- * Licensed under the Apache License, Version 2.0 (the "License");
- * you may not use this file except in compliance with the License.
- * You may obtain a copy of the License at
- *
- *     http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-
-package com.nvidia.spark.rapids
-
-/**
- * Utility methods for managing spillable buffer priorities.
- * The spill priority numerical space is divided into potentially overlapping
- * ranges based on the type of buffer.
- */
-object SpillPriorities {
-  /**
-   * Priorities for task output buffers intended for shuffle.
-   */
-  val OUTPUT_FOR_SHUFFLE_INITIAL_TASK_PRIORITY: Long = Long.MinValue
-
-  /**
-   * Priorities for buffers received from shuffle.
-   * Shuffle input buffers are about to be read by a task, so spill
-   * them if there's no other choice, but leave some space at the end of the priority range
-   * so there can be some things after it.
-   */
-  val INPUT_FROM_SHUFFLE_PRIORITY: Long = Long.MaxValue - 1000
-
-  /**
-   * Priority for buffers that are waiting for next to be called.  i.e. data held between
-   * calls to `hasNext` and `next` or between different calls to `next`.
-   */
-  val ACTIVE_ON_DECK_PRIORITY: Long = INPUT_FROM_SHUFFLE_PRIORITY + 1
-
-  /**
-   * Priority for multiple buffers being buffered within a call to next.
-   */
-  val ACTIVE_BATCHING_PRIORITY: Long = ACTIVE_ON_DECK_PRIORITY + 100
-
-  /**
-   * Priority offset for host memory buffers for spilling.
-   */
-  val HOST_MEMORY_BUFFER_SPILL_OFFSET: Long = 0
-
-  /**
-   * Calculate a new priority based on an offset, clamping it to avoid wraparound.
-   *
-   * @param originalPriority the original priority
-   * @param offset           the desired offset
-   * @return the resulting priority, with clamping if needed
-   */
-  def applyPriorityOffset(originalPriority: Long, offset: Long): Long = {
-    if (offset < 0 && originalPriority < Long.MinValue - offset) {
-      Long.MinValue
-    } else if (offset > 0 && originalPriority > Long.MaxValue - offset) {
-      Long.MaxValue
-    } else {
-      originalPriority + offset
-    }
-  }
-}
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/SpillableKudoTable.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/SpillableKudoTable.scala
deleted file mode 100644
index 5bba5169de2..00000000000
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/SpillableKudoTable.scala
+++ /dev/null
@@ -1,59 +0,0 @@
-/*
- * Copyright (c) 2025, NVIDIA CORPORATION.
- *
- * Licensed under the Apache License, Version 2.0 (the "License");
- * you may not use this file except in compliance with the License.
- * You may obtain a copy of the License at
- *
- *     http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-package com.nvidia.spark.rapids
-
-import ai.rapids.cudf.HostMemoryBuffer
-import com.nvidia.spark.rapids.jni.kudo.KudoTable
-import com.nvidia.spark.rapids.jni.kudo.KudoTableHeader
-
-
-class SpillableKudoTable(val header: KudoTableHeader,
-    val length: Long,
-    shb: SpillableHostBuffer)
-  extends AutoCloseable {
-
-  def makeKudoTable: KudoTable = {
-    if (shb == null) {
-      new KudoTable(header, null)
-    } else {
-      new KudoTable(header, shb.getHostBuffer())
-    }
-  }
-
-  override def toString: String =
-    "SpillableKudoTable{header=" + this.header + ", shb=" + this.shb + '}'
-
-  override def close(): Unit = {
-    if (shb != null) shb.close()
-  }
-}
-
-object SpillableKudoTable {
-  def apply(header: KudoTableHeader, buffer: HostMemoryBuffer): SpillableKudoTable = {
-    if (buffer == null) {
-      new SpillableKudoTable(header, 0, null)
-    } else {
-      new SpillableKudoTable(
-        header,
-        buffer.getLength,
-        SpillableHostBuffer.apply(
-          buffer,
-          buffer.getLength,
-          SpillPriorities.ACTIVE_BATCHING_PRIORITY)
-      )
-    }
-  }
-}
\ No newline at end of file
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/TableCompressionCodec.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/TableCompressionCodec.scala
index 1c45b31b986..09b04d0e8f3 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/TableCompressionCodec.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/TableCompressionCodec.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2020-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2020-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -21,22 +21,7 @@ import scala.collection.mutable.ArrayBuffer
 import ai.rapids.cudf.{BaseDeviceMemoryBuffer, ContiguousTable, Cuda, DeviceMemoryBuffer}
 import com.nvidia.spark.rapids.Arm.{closeOnExcept, withResource}
 import com.nvidia.spark.rapids.RapidsPluginImplicits._
-import com.nvidia.spark.rapids.format.{BufferMeta, CodecType, TableMeta}
-
-import org.apache.spark.internal.Logging
-
-/**
- * Compressed table descriptor
- * @param compressedSize size of the compressed data in bytes
- * @param meta metadata describing the table layout when uncompressed
- * @param buffer buffer containing the compressed data
- */
-case class CompressedTable(
-    compressedSize: Long,
-    meta: TableMeta,
-    buffer: DeviceMemoryBuffer) extends AutoCloseable {
-  override def close(): Unit = buffer.close()
-}
+import com.nvidia.spark.rapids.format.{BufferMeta, CodecType}
 
 /** An interface to a compression codec that can compress a contiguous Table on the GPU */
 trait TableCompressionCodec {
@@ -71,12 +56,15 @@ trait TableCompressionCodec {
       stream: Cuda.Stream): BatchedBufferDecompressor
 }
 
-/**
- * A small case class used to carry codec-specific settings.
- */
-case class TableCompressionCodecConfig(lz4ChunkSize: Long, zstdChunkSize: Long)
+object TableCompressionCodec {
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+
+  /**
+   * Logs at DEBUG. `msg` is by-name, so it is only evaluated when DEBUG is enabled.
+   */
+  private def logDebug(msg: => String): Unit =
+    if (log.isDebugEnabled) log.debug(msg)
 
-object TableCompressionCodec extends Logging {
   private val codecNameToId = Map(
     "copy" -> CodecType.COPY,
     "zstd" -> CodecType.NVCOMP_ZSTD,
@@ -84,7 +72,7 @@ object TableCompressionCodec extends Logging {
 
   /** Make a codec configuration object which can be serialized (can be used in tasks) */
   def makeCodecConfig(rapidsConf: RapidsConf): TableCompressionCodecConfig =
-    TableCompressionCodecConfig(
+    new TableCompressionCodecConfig(
       rapidsConf.shuffleCompressionLz4ChunkSize,
       rapidsConf.shuffleCompressionZstdChunkSize)
 
@@ -117,7 +105,15 @@ object TableCompressionCodec extends Logging {
  * @param stream CUDA stream to use
  */
 abstract class BatchedTableCompressor(maxBatchMemorySize: Long, stream: Cuda.Stream)
-    extends AutoCloseable with Logging {
+    extends AutoCloseable {
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+
+  /**
+   * Logs at DEBUG. `msg` is by-name, so it is only evaluated when DEBUG is enabled.
+   */
+  private def logDebug(msg: => String): Unit =
+    if (log.isDebugEnabled) log.debug(msg)
+
   // The tables that need to be compressed in the next batch
   private[this] val tables = new ArrayBuffer[ContiguousTable]
 
@@ -237,7 +233,7 @@ abstract class BatchedTableCompressor(maxBatchMemorySize: Long, stream: Cuda.Str
             ct.buffer.incRefCount()
             ct.buffer
           }
-          CompressedTable(ct.compressedSize, ct.meta, newBuffer)
+          new CompressedTable(ct.compressedSize, ct.meta, newBuffer)
         }
       }
     }
@@ -262,7 +258,15 @@ abstract class BatchedTableCompressor(maxBatchMemorySize: Long, stream: Cuda.Str
  * @param stream CUDA stream to use
  */
 abstract class BatchedBufferDecompressor(maxBatchMemorySize: Long, stream: Cuda.Stream)
-    extends AutoCloseable with Logging {
+    extends AutoCloseable {
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+  // Emits `msg` at DEBUG; being by-name, the message is not built unless DEBUG is enabled.
+  private def logDebug(msg: => String): Unit = {
+    if (log.isDebugEnabled) {
+      log.debug(msg)
+    }
+  }
+
   // The buffers of compressed data that will be decompressed in the next batch
   private[this] val inputBuffers = new ArrayBuffer[BaseDeviceMemoryBuffer]
 
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/ThreadFactoryBuilder.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/ThreadFactoryBuilder.scala
deleted file mode 100644
index d61dd5a9c90..00000000000
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/ThreadFactoryBuilder.scala
+++ /dev/null
@@ -1,52 +0,0 @@
-/*
- * Copyright (c) 2022, NVIDIA CORPORATION.
- *
- * Licensed under the Apache License, Version 2.0 (the "License");
- * you may not use this file except in compliance with the License.
- * You may obtain a copy of the License at
- *
- *     http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-
-package com.nvidia.spark.rapids
-
-import java.util.concurrent.{Executors, ThreadFactory}
-import java.util.concurrent.atomic.AtomicLong
-
-// This is similar to Guava ThreadFactoryBuilder
-// Avoid to use Guava as it is a messy dependency in practice.
-class ThreadFactoryBuilder {
-  private var nameFormat = Option.empty[String]
-  private var daemon = Option.empty[Boolean]
-
-  def setNameFormat(nameFormat: String): ThreadFactoryBuilder = {
-    nameFormat.format(0)
-    this.nameFormat = Some(nameFormat)
-    this
-  }
-
-  def setDaemon(daemon: Boolean): ThreadFactoryBuilder = {
-    this.daemon = Some(daemon)
-    this
-  }
-
-  def build(): ThreadFactory = {
-    val count = nameFormat.map(_ => new AtomicLong(0))
-    new ThreadFactory() {
-      private val defaultThreadFactory = Executors.defaultThreadFactory
-
-      override def newThread(r: Runnable): Thread = {
-        val thread = defaultThreadFactory.newThread(r)
-        nameFormat.foreach(f => thread.setName(f.format(count.get.getAndIncrement())))
-        daemon.foreach(b => thread.setDaemon(b))
-        thread
-      }
-    }
-  }
-}
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/TypeChecks.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/TypeChecks.scala
index 18055111ee4..13622d07c44 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/TypeChecks.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/TypeChecks.scala
@@ -746,30 +746,33 @@ abstract class TypeChecks[RET] {
 /**
  * Checks a set of named inputs to an SparkPlan node against a TypeSig
  */
-case class InputCheck(cudf: TypeSig, spark: TypeSig, notes: List[String] = List.empty)
+class InputCheck(val cudf: TypeSig, val spark: TypeSig, val notes: List[String])
+    extends Serializable
 
 /**
  * Checks a single parameter by position against a TypeSig
  */
-case class ParamCheck(name: String, cudf: TypeSig, spark: TypeSig)
+class ParamCheck(val name: String, val cudf: TypeSig, val spark: TypeSig)
+    extends Serializable
 
 /**
  * Checks the type signature for a parameter that repeats (Can only be used at the end of a list
  * of position parameters)
  */
-case class RepeatingParamCheck(name: String, cudf: TypeSig, spark: TypeSig)
+class RepeatingParamCheck(val name: String, val cudf: TypeSig, val spark: TypeSig)
+    extends Serializable
 
 /**
  * Checks an expression that have input parameters and a single output.  This is intended to be
  * given for a specific ExpressionContext. If your expression does not meet this pattern you may
  * need to create a custom ExprChecks instance.
  */
-case class ContextChecks(
-    outputCheck: TypeSig,
-    sparkOutputSig: TypeSig,
-    paramCheck: Seq[ParamCheck] = Seq.empty,
-    repeatingParamCheck: Option[RepeatingParamCheck] = None)
-    extends TypeChecks[Map[String, SupportLevel]] {
+class ContextChecks(
+    val outputCheck: TypeSig,
+    val sparkOutputSig: TypeSig,
+    val paramCheck: Seq[ParamCheck],
+    val repeatingParamCheck: Option[RepeatingParamCheck])
+    extends TypeChecks[Map[String, SupportLevel]] with Serializable {
 
   def tagAst(exprMeta: BaseExprMeta[_]): Unit = {
     tagBase(exprMeta, exprMeta.willNotWorkInAst)
@@ -965,10 +968,10 @@ object ExecChecks {
  */
 abstract class PartChecks extends TypeChecks[Map[String, SupportLevel]]
 
-case class PartChecksImpl(
-    paramCheck: Seq[ParamCheck] = Seq.empty,
-    repeatingParamCheck: Option[RepeatingParamCheck] = None)
-    extends PartChecks {
+class PartChecksImpl(
+    val paramCheck: Seq[ParamCheck],
+    val repeatingParamCheck: Option[RepeatingParamCheck])
+    extends PartChecks with Serializable {
 
   override def tag(meta: RapidsMeta[_, _, _]): Unit = {
     val part = meta.wrapped
@@ -1005,9 +1008,9 @@ case class PartChecksImpl(
 
 object PartChecks {
   def apply(repeatingParamCheck: RepeatingParamCheck): PartChecks =
-    PartChecksImpl(Seq.empty, Some(repeatingParamCheck))
+    new PartChecksImpl(Seq.empty, Some(repeatingParamCheck))
 
-  def apply(): PartChecks = PartChecksImpl()
+  def apply(): PartChecks = new PartChecksImpl(Seq.empty, None)
 }
 
 /**
@@ -1020,7 +1023,7 @@ abstract class ExprChecks extends TypeChecks[Map[ExpressionContext, Map[String,
   def tagAst(meta: BaseExprMeta[_]): Unit
 }
 
-case class ExprChecksImpl(contexts: Map[ExpressionContext, ContextChecks])
+class ExprChecksImpl(val contexts: Map[ExpressionContext, ContextChecks])
     extends ExprChecks {
   override def tag(meta: RapidsMeta[_, _, _]): Unit = {
     val exprMeta = meta.asInstanceOf[BaseExprMeta[_]]
@@ -1499,9 +1502,9 @@ object ExprChecks {
       sparkOutputSig: TypeSig,
       paramCheck: Seq[ParamCheck] = Seq.empty,
       repeatingParamCheck: Option[RepeatingParamCheck] = None): ExprChecks =
-    ExprChecksImpl(Map(
+    new ExprChecksImpl(Map(
       (ProjectExprContext,
-          ContextChecks(outputCheck, sparkOutputSig, paramCheck, repeatingParamCheck))))
+          new ContextChecks(outputCheck, sparkOutputSig, paramCheck, repeatingParamCheck))))
 
   /**
    * A check for an expression that supports project and as much of AST as it can.
@@ -1514,16 +1517,16 @@ object ExprChecks {
       repeatingParamCheck: Option[RepeatingParamCheck] = None): ExprChecks = {
     val astOutputCheck = outputCheck.intersect(allowedAstTypes)
     val astParamCheck = paramCheck.map { pc =>
-      ParamCheck(pc.name, pc.cudf.intersect(allowedAstTypes), pc.spark)
+      new ParamCheck(pc.name, pc.cudf.intersect(allowedAstTypes), pc.spark)
     }
     val astRepeatingParamCheck = repeatingParamCheck.map { rpc =>
-      RepeatingParamCheck(rpc.name, rpc.cudf.intersect(allowedAstTypes), rpc.spark)
+      new RepeatingParamCheck(rpc.name, rpc.cudf.intersect(allowedAstTypes), rpc.spark)
     }
-    ExprChecksImpl(Map(
+    new ExprChecksImpl(Map(
       ProjectExprContext ->
-          ContextChecks(outputCheck, sparkOutputSig, paramCheck, repeatingParamCheck),
+          new ContextChecks(outputCheck, sparkOutputSig, paramCheck, repeatingParamCheck),
       AstExprContext ->
-          ContextChecks(astOutputCheck, sparkOutputSig, astParamCheck, astRepeatingParamCheck)
+          new ContextChecks(astOutputCheck, sparkOutputSig, astParamCheck, astRepeatingParamCheck)
     ))
   }
 
@@ -1536,7 +1539,7 @@ object ExprChecks {
       inputCheck: TypeSig,
       sparkInputSig: TypeSig): ExprChecks =
     projectOnly(outputCheck, sparkOutputSig,
-      Seq(ParamCheck("input", inputCheck, sparkInputSig)))
+      Seq(new ParamCheck("input", inputCheck, sparkInputSig)))
 
   /**
    * A check for a unary expression that supports project and as much AST as it can.
@@ -1548,7 +1551,7 @@ object ExprChecks {
       inputCheck: TypeSig,
       sparkInputSig: TypeSig): ExprChecks =
     projectAndAst(allowedAstTypes, outputCheck, sparkOutputSig,
-      Seq(ParamCheck("input", inputCheck, sparkInputSig)))
+      Seq(new ParamCheck("input", inputCheck, sparkInputSig)))
 
   /**
    * Unary expression checks for project where the input matches the output.
@@ -1587,8 +1590,8 @@ object ExprChecks {
       param1: (String, TypeSig, TypeSig),
       param2: (String, TypeSig, TypeSig)): ExprChecks =
     projectOnly(outputCheck, sparkOutputSig,
-      Seq(ParamCheck(param1._1, param1._2, param1._3),
-        ParamCheck(param2._1, param2._2, param2._3)))
+      Seq(new ParamCheck(param1._1, param1._2, param1._3),
+        new ParamCheck(param2._1, param2._2, param2._3)))
 
   /**
    * Helper function for a binary expression where the plugin supports project and AST.
@@ -1600,8 +1603,8 @@ object ExprChecks {
       param1: (String, TypeSig, TypeSig),
       param2: (String, TypeSig, TypeSig)): ExprChecks =
     projectAndAst(allowedAstTypes, outputCheck, sparkOutputSig,
-      Seq(ParamCheck(param1._1, param1._2, param1._3),
-        ParamCheck(param2._1, param2._2, param2._3)))
+      Seq(new ParamCheck(param1._1, param1._2, param1._3),
+        new ParamCheck(param2._1, param2._2, param2._3)))
 
   /**
    * Aggregate operation where only group by agg and reduction is supported in the plugin and in
@@ -1612,11 +1615,11 @@ object ExprChecks {
       sparkOutputSig: TypeSig,
       paramCheck: Seq[ParamCheck] = Seq.empty,
       repeatingParamCheck: Option[RepeatingParamCheck] = None): ExprChecks =
-    ExprChecksImpl(Map(
+    new ExprChecksImpl(Map(
       (GroupByAggExprContext,
-          ContextChecks(outputCheck, sparkOutputSig, paramCheck, repeatingParamCheck)),
+          new ContextChecks(outputCheck, sparkOutputSig, paramCheck, repeatingParamCheck)),
       (ReductionAggExprContext,
-          ContextChecks(outputCheck, sparkOutputSig, paramCheck, repeatingParamCheck))))
+          new ContextChecks(outputCheck, sparkOutputSig, paramCheck, repeatingParamCheck))))
 
   /**
    * Aggregate operation where window, reduction, and group by agg are all supported the same.
@@ -1626,13 +1629,13 @@ object ExprChecks {
       sparkOutputSig: TypeSig,
       paramCheck: Seq[ParamCheck] = Seq.empty,
       repeatingParamCheck: Option[RepeatingParamCheck] = None): ExprChecks =
-    ExprChecksImpl(Map(
+    new ExprChecksImpl(Map(
       (GroupByAggExprContext,
-          ContextChecks(outputCheck, sparkOutputSig, paramCheck, repeatingParamCheck)),
+          new ContextChecks(outputCheck, sparkOutputSig, paramCheck, repeatingParamCheck)),
       (ReductionAggExprContext,
-          ContextChecks(outputCheck, sparkOutputSig, paramCheck, repeatingParamCheck)),
+          new ContextChecks(outputCheck, sparkOutputSig, paramCheck, repeatingParamCheck)),
       (WindowAggExprContext,
-          ContextChecks(outputCheck, sparkOutputSig, paramCheck, repeatingParamCheck))))
+          new ContextChecks(outputCheck, sparkOutputSig, paramCheck, repeatingParamCheck))))
 
   /**
    * For a generic expression that can work as both an aggregation and in the project context.
@@ -1643,15 +1646,15 @@ object ExprChecks {
       sparkOutputSig: TypeSig,
       paramCheck: Seq[ParamCheck] = Seq.empty,
       repeatingParamCheck: Option[RepeatingParamCheck] = None): ExprChecks =
-    ExprChecksImpl(Map(
+    new ExprChecksImpl(Map(
       (GroupByAggExprContext,
-          ContextChecks(outputCheck, sparkOutputSig, paramCheck, repeatingParamCheck)),
+          new ContextChecks(outputCheck, sparkOutputSig, paramCheck, repeatingParamCheck)),
       (ReductionAggExprContext,
-          ContextChecks(outputCheck, sparkOutputSig, paramCheck, repeatingParamCheck)),
+          new ContextChecks(outputCheck, sparkOutputSig, paramCheck, repeatingParamCheck)),
       (WindowAggExprContext,
-          ContextChecks(outputCheck, sparkOutputSig, paramCheck, repeatingParamCheck)),
+          new ContextChecks(outputCheck, sparkOutputSig, paramCheck, repeatingParamCheck)),
       (ProjectExprContext,
-          ContextChecks(outputCheck, sparkOutputSig, paramCheck, repeatingParamCheck))))
+          new ContextChecks(outputCheck, sparkOutputSig, paramCheck, repeatingParamCheck))))
 
   /**
    * An aggregation check where group by and reduction are supported by the plugin, but Spark
@@ -1663,18 +1666,18 @@ object ExprChecks {
       paramCheck: Seq[ParamCheck] = Seq.empty,
       repeatingParamCheck: Option[RepeatingParamCheck] = None): ExprChecks = {
     val windowParamCheck = paramCheck.map { pc =>
-      ParamCheck(pc.name, TypeSig.none, pc.spark)
+      new ParamCheck(pc.name, TypeSig.none, pc.spark)
     }
     val windowRepeat = repeatingParamCheck.map { pc =>
-      RepeatingParamCheck(pc.name, TypeSig.none, pc.spark)
+      new RepeatingParamCheck(pc.name, TypeSig.none, pc.spark)
     }
-    ExprChecksImpl(Map(
+    new ExprChecksImpl(Map(
       (GroupByAggExprContext,
-          ContextChecks(outputCheck, sparkOutputSig, paramCheck, repeatingParamCheck)),
+          new ContextChecks(outputCheck, sparkOutputSig, paramCheck, repeatingParamCheck)),
       (ReductionAggExprContext,
-          ContextChecks(outputCheck, sparkOutputSig, paramCheck, repeatingParamCheck)),
+          new ContextChecks(outputCheck, sparkOutputSig, paramCheck, repeatingParamCheck)),
       (WindowAggExprContext,
-          ContextChecks(TypeSig.none, sparkOutputSig, windowParamCheck, windowRepeat))))
+          new ContextChecks(TypeSig.none, sparkOutputSig, windowParamCheck, windowRepeat))))
   }
 
   /**
@@ -1686,9 +1689,9 @@ object ExprChecks {
       sparkOutputSig: TypeSig,
       paramCheck: Seq[ParamCheck] = Seq.empty,
       repeatingParamCheck: Option[RepeatingParamCheck] = None): ExprChecks =
-    ExprChecksImpl(Map(
+    new ExprChecksImpl(Map(
       (WindowAggExprContext,
-          ContextChecks(outputCheck, sparkOutputSig, paramCheck, repeatingParamCheck))))
+          new ContextChecks(outputCheck, sparkOutputSig, paramCheck, repeatingParamCheck))))
 
 
   /**
@@ -1701,18 +1704,18 @@ object ExprChecks {
       paramCheck: Seq[ParamCheck] = Seq.empty,
       repeatingParamCheck: Option[RepeatingParamCheck] = None): ExprChecks = {
     val noneParamCheck = paramCheck.map { pc =>
-      ParamCheck(pc.name, TypeSig.none, pc.spark)
+      new ParamCheck(pc.name, TypeSig.none, pc.spark)
     }
     val noneRepeatCheck = repeatingParamCheck.map { pc =>
-      RepeatingParamCheck(pc.name, TypeSig.none, pc.spark)
+      new RepeatingParamCheck(pc.name, TypeSig.none, pc.spark)
     }
-    ExprChecksImpl(Map(
+    new ExprChecksImpl(Map(
       (ReductionAggExprContext,
-        ContextChecks(TypeSig.none, sparkOutputSig, noneParamCheck, noneRepeatCheck)),
+        new ContextChecks(TypeSig.none, sparkOutputSig, noneParamCheck, noneRepeatCheck)),
       (GroupByAggExprContext,
-        ContextChecks(outputCheck, sparkOutputSig, paramCheck, repeatingParamCheck)),
+        new ContextChecks(outputCheck, sparkOutputSig, paramCheck, repeatingParamCheck)),
       (WindowAggExprContext,
-        ContextChecks(TypeSig.none, sparkOutputSig, noneParamCheck, noneRepeatCheck))))
+        new ContextChecks(TypeSig.none, sparkOutputSig, noneParamCheck, noneRepeatCheck))))
   }
 
   /**
@@ -1725,18 +1728,18 @@ object ExprChecks {
       paramCheck: Seq[ParamCheck] = Seq.empty,
       repeatingParamCheck: Option[RepeatingParamCheck] = None): ExprChecks = {
     val noneParamCheck = paramCheck.map { pc =>
-      ParamCheck(pc.name, TypeSig.none, pc.spark)
+      new ParamCheck(pc.name, TypeSig.none, pc.spark)
     }
     val noneRepeatCheck = repeatingParamCheck.map { pc =>
-      RepeatingParamCheck(pc.name, TypeSig.none, pc.spark)
+      new RepeatingParamCheck(pc.name, TypeSig.none, pc.spark)
     }
-    ExprChecksImpl(Map(
+    new ExprChecksImpl(Map(
       (ReductionAggExprContext,
-          ContextChecks(TypeSig.none, sparkOutputSig, noneParamCheck, noneRepeatCheck)),
+          new ContextChecks(TypeSig.none, sparkOutputSig, noneParamCheck, noneRepeatCheck)),
       (GroupByAggExprContext,
-          ContextChecks(outputCheck, sparkOutputSig, paramCheck, repeatingParamCheck)),
+          new ContextChecks(outputCheck, sparkOutputSig, paramCheck, repeatingParamCheck)),
       (WindowAggExprContext,
-          ContextChecks(outputCheck, sparkOutputSig, paramCheck, repeatingParamCheck))))
+          new ContextChecks(outputCheck, sparkOutputSig, paramCheck, repeatingParamCheck))))
   }
 }
 
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/VersionUtils.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/VersionUtils.scala
index 929abfed832..3f36ca48fc8 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/VersionUtils.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/VersionUtils.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2021-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2021-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -18,9 +18,14 @@ package com.nvidia.spark.rapids
 
 import com.nvidia.spark.rapids.jni.{SparkPlatformType => PlatformForJni, Version => VersionForJni}
 
-import org.apache.spark.internal.Logging
 
-object VersionUtils extends Logging {
+object VersionUtils {
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+
+  // Warn-level logging helper: the by-name `msg` is only evaluated when WARN is enabled.
+  private def logWarning(msg: => String): Unit = {
+    if (log.isWarnEnabled) log.warn(msg)
+  }
 
   lazy val isSpark320OrLater: Boolean = cmpSparkVersion(3, 2, 0) >= 0
 
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/asyncProfiler.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/asyncProfiler.scala
index 1cd6f625909..75bdab0b7e1 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/asyncProfiler.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/asyncProfiler.scala
@@ -30,7 +30,6 @@ import org.apache.hadoop.fs.Path
 
 import org.apache.spark.TaskContext
 import org.apache.spark.api.plugin.PluginContext
-import org.apache.spark.internal.Logging
 import org.apache.spark.util.SerializableConfiguration
 
 /**
@@ -55,7 +54,9 @@ import org.apache.spark.util.SerializableConfiguration
  *
  */
 
-object AsyncProfilerOnExecutor extends Logging {
+object AsyncProfilerOnExecutor {
+  // Strip the module-class "$" so the logger name matches the other loggers in this change.
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
 
   private var asyncProfilerPrefix: Option[String] = None
   private var asyncProfiler: Option[AsyncProfiler] = None
@@ -347,7 +348,7 @@ object AsyncProfilerOnExecutor extends Logging {
               val outPath = new Path(asyncProfilerPrefix.get, 
                 if (jfrCompressionEnabled) baseFileName + ".gz" else baseFileName)
               
-              val hadoopConf = pluginCtx.ask(ProfileInitMsg(executorId, outPath.toString))
+              val hadoopConf = pluginCtx.ask(new ProfileInitMsg(executorId, outPath.toString))
                 .asInstanceOf[SerializableConfiguration].value
               val fs = outPath.getFileSystem(hadoopConf)
 
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/basicPhysicalOperators.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/basicPhysicalOperators.scala
index afab2a5ae09..3ec1b932a19 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/basicPhysicalOperators.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/basicPhysicalOperators.scala
@@ -33,7 +33,6 @@ import com.nvidia.spark.rapids.jni.GpuSplitAndRetryOOM
 import com.nvidia.spark.rapids.shims._
 
 import org.apache.spark.{InterruptibleIterator, Partition, SparkContext, TaskContext}
-import org.apache.spark.internal.Logging
 import org.apache.spark.rdd.RDD
 import org.apache.spark.sql.catalyst.InternalRow
 import org.apache.spark.sql.catalyst.expressions._
@@ -53,7 +52,7 @@ class GpuProjectExecMeta(
     conf: RapidsConf,
     p: Option[RapidsMeta[_, _, _]],
     r: DataFromReplacementRule) extends SparkPlanMeta[ProjectExec](proj, conf, p, r)
-    with Logging {
+    with RapidsLocalLog {
   override def convertToGpu(): GpuExec = {
     // Force list to avoid recursive Java serialization of lazy list Seq implementation
     val gpuExprs = childExprs.map(_.convertToGpu().asInstanceOf[NamedExpression]).toList
@@ -1012,7 +1011,7 @@ case class GpuProjectAstExec(
  *   Input columns for tier 3: a, c, e, f, ref2, ref3
  *   Tier 3: (ref2 * e), (ref3 * f), (a + e), (c + f)
  */
- case class GpuTieredProject(exprTiers: Seq[Seq[GpuExpression]]) {
+ class GpuTieredProject(val exprTiers: Seq[Seq[GpuExpression]]) extends Serializable {
 
   /**
    * Inject metrics into all expressions across all tiers.
@@ -1319,7 +1318,7 @@ object GpuFilter {
   }
 }
 
-case class GpuFilterExecMeta(
+class GpuFilterExecMeta(
   filter: FilterExec,
   override val conf: RapidsConf,
   parentMetaOpt: Option[RapidsMeta[_, _, _]],
@@ -1400,7 +1399,7 @@ class GpuSampleExecMeta(
     conf: RapidsConf,
     p: Option[RapidsMeta[_, _, _]],
     r: DataFromReplacementRule) extends SparkPlanMeta[SampleExec](sample, conf, p, r)
-    with Logging {
+    with RapidsLocalLog {
   override def convertToGpu(): GpuExec = {
     val gpuChild = childPlans.head.convertIfNeeded()
     if (conf.isFastSampleEnabled) {
@@ -1569,7 +1568,7 @@ private[rapids] class GpuRangeIterator(
     step: Long,
     maxRowCountPerBatch: Long,
     taskContext: TaskContext,
-    opTime: GpuMetric) extends Iterator[ColumnarBatch] with Logging {
+    opTime: GpuMetric) extends Iterator[ColumnarBatch] with RapidsLocalLog {
 
   // This iterator is designed for GpuRangeExec, so it has the requirement for the inputs.
   assert((partitionEnd - partitionStart) % step == 0)
@@ -1609,7 +1608,7 @@ private[rapids] class GpuRangeIterator(
       val remainingRows = (safePartitionEnd - start) / step
       // Start is inclusive so we need to produce at least one row
       val rowsExpected = Math.max(1, Math.min(remainingRows, maxRowCountPerBatch))
-      val iter = withRetry(AutoCloseableLong(rowsExpected), reduceRowsNumberByHalf) { rows =>
+      val iter = withRetry(new AutoCloseableLong(rowsExpected), reduceRowsNumberByHalf) { rows =>
         withResource(Scalar.fromLong(start)) { startScalar =>
           withResource(Scalar.fromLong(step)) { stepScalar =>
             withResource(
@@ -1658,12 +1657,12 @@ private[rapids] class GpuRangeIterator(
           throw new GpuSplitAndRetryOOM(s"GPU OutOfMemory: the number of rows generated is" +
             s" too small to be split ${rowsNumber.value}!")
         }
-        Seq(AutoCloseableLong(rowsNumber.value / 2))
+        Seq(new AutoCloseableLong(rowsNumber.value / 2))
       }
     }
 
   /** A bridge class between Long and AutoCloseable for retry */
-  case class AutoCloseableLong(value: Long) extends AutoCloseable {
+  class AutoCloseableLong(val value: Long) extends AutoCloseable {
     override def close(): Unit = { /* Nothing to be closed */ }
   }
 }
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/dataSourceUtil.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/dataSourceUtil.scala
index aee11b3c84d..436a6b90f10 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/dataSourceUtil.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/dataSourceUtil.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2022, NVIDIA CORPORATION.
+ * Copyright (c) 2022-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -40,18 +40,6 @@ class PartitionIterator[T](reader: PartitionReader[T]) extends Iterator[T] {
   }
 }
 
-class MetricsBatchIterator(iter: Iterator[ColumnarBatch]) extends Iterator[ColumnarBatch] {
-  private[this] val inputMetrics = TaskContext.get().taskMetrics().inputMetrics
-
-  override def hasNext: Boolean = iter.hasNext
-
-  override def next(): ColumnarBatch = {
-    val batch = iter.next()
-    TrampolineUtil.incInputRecordsRows(inputMetrics, batch.numRows())
-    batch
-  }
-}
-
 /** Wraps a columnar PartitionReader to update bytes read metric based on filesystem statistics. */
 class PartitionReaderWithBytesRead(reader: PartitionReader[ColumnarBatch])
     extends PartitionReader[ColumnarBatch] {
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/fileio/hadoop/S3InputFile.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/fileio/hadoop/S3InputFile.scala
deleted file mode 100644
index 3a8c7ed9185..00000000000
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/fileio/hadoop/S3InputFile.scala
+++ /dev/null
@@ -1,91 +0,0 @@
-/*
- * Copyright (c) 2026, NVIDIA CORPORATION.
- *
- * Licensed under the Apache License, Version 2.0 (the "License");
- * you may not use this file except in compliance with the License.
- * You may obtain a copy of the License at
- *
- *     http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-
-package com.nvidia.spark.rapids.fileio.hadoop
-
-import java.io.IOException
-import java.net.URI
-import java.util.OptionalLong
-
-import scala.collection.JavaConverters._
-
-import ai.rapids.cudf.HostMemoryBuffer
-import com.nvidia.spark.rapids.{IntRangeWithOffset, PerfIO, RangeWithOffset, SuffixRangeWithOffset}
-import com.nvidia.spark.rapids.jni.fileio.{RapidsInputFile, SeekableInputStream}
-import org.apache.hadoop.conf.Configuration
-import org.apache.hadoop.fs.Path
-
-/**
- * S3-backed {@link RapidsInputFile} for Hadoop-conf-driven (non-iceberg) reads.
- * {@code readVectored} issues batched byte-range GETs through the optimized
- * vectored-read path; the other operations delegate to the standard
- * {@link HadoopInputFile}.
- */
-class S3InputFile private (
-    delegate: HadoopInputFile,
-    fileUri: URI,
-    hadoopConf: Configuration)
-  extends RapidsInputFile {
-
-  override def path(): String = delegate.path()
-
-  @throws[IOException]
-  override def getLength(): Long = delegate.getLength()
-
-  @throws[IOException]
-  override def getLastModificationTime(): OptionalLong = delegate.getLastModificationTime()
-
-  @throws[IOException]
-  override def open(): SeekableInputStream = delegate.open()
-
-  @throws[IOException]
-  override def readVectored(
-      output: HostMemoryBuffer,
-      copyRanges: java.util.List[RapidsInputFile.CopyRange]): Unit = {
-    val ranges = copyRanges.asScala.map { r =>
-      IntRangeWithOffset(r.getInputOffset, r.getLength, r.getOutputOffset)
-    }.toSeq
-    require(
-      PerfIO.readToHostMemory(hadoopConf, output, fileUri, ranges).isDefined,
-      "expected to use PerfIO to read")
-  }
-
-  /**
-   * Issue a single suffix-range {@code GetObject} ({@code Range: bytes=-N}) for
-   * the last {@code length} bytes. Avoids the {@code getLength()} round-trip the
-   * default {@link RapidsInputFile#readTail} would make.
-   */
-  @throws[IOException]
-  override def readTail(length: Long, output: HostMemoryBuffer): Unit = {
-    if (length == 0) {
-      return
-    }
-    if (length < 0) {
-      throw new IllegalArgumentException("length must be non-negative")
-    }
-    val ranges = Seq[RangeWithOffset](SuffixRangeWithOffset(length, /*destOffset*/ 0L))
-    require(
-      PerfIO.readToHostMemory(hadoopConf, output, fileUri, ranges).isDefined,
-      "expected to use PerfIO to read")
-  }
-}
-
-object S3InputFile {
-  @throws[IOException]
-  def create(filePath: Path, conf: Configuration): S3InputFile = {
-    new S3InputFile(HadoopInputFile.create(filePath, conf), filePath.toUri, conf)
-  }
-}
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/higherOrderFunctions.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/higherOrderFunctions.scala
index ae23430a90b..7364ef7ce2a 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/higherOrderFunctions.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/higherOrderFunctions.scala
@@ -28,6 +28,7 @@ import com.nvidia.spark.rapids.shims.ShimExpression
 import org.apache.spark.sql.catalyst.analysis.TypeCoercion
 import org.apache.spark.sql.catalyst.expressions.{Add, And, ArrayAggregate, Attribute, AttributeReference, AttributeSeq, CaseWhen, Cast, Expression, ExprId, Greatest, If, LambdaFunction, Least, Literal, Multiply, NamedExpression, NamedLambdaVariable, Or}
 import org.apache.spark.sql.internal.SQLConf
+import org.apache.spark.sql.rapids.GpuMapDedupPolicy
 import org.apache.spark.sql.types.{ArrayType, BooleanType, ByteType, DataType, Decimal, DecimalType, DoubleType, FloatType, IntegerType, LongType, MapType, Metadata, NumericType, ShortType, StructField, StructType}
 import org.apache.spark.sql.vectorized.ColumnarBatch
 
@@ -527,8 +528,7 @@ case class GpuTransformKeys(
   override def prettyName: String = "transform_keys"
 
-  // Spark 4.1+ returns an enum value instead of String, so use toString first
+  // Spark 4.1+ returns an enum instead of a String; presumably handled in GpuMapDedupPolicy
-  private def exceptionOnDupKeys =
-    SQLConf.get.getConf(SQLConf.MAP_KEY_DEDUP_POLICY).toString.toUpperCase == "EXCEPTION"
+  private def exceptionOnDupKeys = GpuMapDedupPolicy.isException
 
   override lazy val hasSideEffects: Boolean =
     function.nullable || exceptionOnDupKeys || super.hasSideEffects
@@ -1140,13 +1140,13 @@ case object AnyOp extends AggOp {
  * @param accVarExprId   the accumulator NamedLambdaVariable's exprId
  * @param elemVar        the element NamedLambdaVariable (used to build the g lambda)
  */
-case class ArrayAggregateDecomposition(
-    op: AggOp,
-    g: Expression,
-    accVarExprId: ExprId,
-    elemVar: NamedLambdaVariable)
+class ArrayAggregateDecomposition(
+    val op: AggOp,
+    val g: Expression,
+    val accVarExprId: ExprId,
+    val elemVar: NamedLambdaVariable) extends Serializable
 
-private case class ExtractedG(g: Expression, hasBareAccBranch: Boolean)
+private class ExtractedG(val g: Expression, val hasBareAccBranch: Boolean) extends Serializable
 
 
 /**
@@ -1223,7 +1223,7 @@ object ArrayAggregateDecomposer {
         "that no-contribution branch into an identity value")
     }
 
-    Right(ArrayAggregateDecomposition(op, g, accId, elemVar))
+    Right(new ArrayAggregateDecomposition(op, g, accId, elemVar))
   }
 
   /**
@@ -1246,8 +1246,8 @@ object ArrayAggregateDecomposer {
       accId: ExprId,
       op: AggOp): Option[ExtractedG] = {
     op.matchBinary(unwrapDecimalPatternWrappers(e)).flatMap { case (l, r) =>
-      if (isAccRef(l, accId) && !containsAccRef(r, accId)) Some(ExtractedG(r, false))
-      else if (isAccRef(r, accId) && !containsAccRef(l, accId)) Some(ExtractedG(l, false))
+      if (isAccRef(l, accId) && !containsAccRef(r, accId)) Some(new ExtractedG(r, false))
+      else if (isAccRef(r, accId) && !containsAccRef(l, accId)) Some(new ExtractedG(l, false))
       else None
     }
   }
@@ -1264,7 +1264,7 @@ object ArrayAggregateDecomposer {
       op: AggOp,
       accType: DataType): Option[ExtractedG] = {
     if (isAccRef(branch, accId)) {
-      Some(ExtractedG(op.identityLiteral(accType), true))
+      Some(new ExtractedG(op.identityLiteral(accType), true))
     } else {
       extractG(branch, accId, op, accType)
     }
@@ -1279,7 +1279,7 @@ object ArrayAggregateDecomposer {
       for {
         tG <- extractBranch(t, accId, op, accType)
         fG <- extractBranch(f, accId, op, accType)
-      } yield ExtractedG(If(cond, tG.g, fG.g), tG.hasBareAccBranch || fG.hasBareAccBranch)
+      } yield new ExtractedG(If(cond, tG.g, fG.g), tG.hasBareAccBranch || fG.hasBareAccBranch)
 
     case CaseWhen(branches, Some(elseValue))
         if branches.forall { case (c, _) => !containsAccRef(c, accId) } =>
@@ -1292,7 +1292,7 @@ object ArrayAggregateDecomposer {
         val gBranches = branchDecs.map { case (c, dec) => (c, dec.get.g) }
         val hasBareAccBranch = branchDecs.exists(_._2.exists(_.hasBareAccBranch)) ||
           elseDec.exists(_.hasBareAccBranch)
-        Some(ExtractedG(CaseWhen(gBranches, Some(elseDec.get.g)), hasBareAccBranch))
+        Some(new ExtractedG(CaseWhen(gBranches, Some(elseDec.get.g)), hasBareAccBranch))
       }
 
     case _ => None
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/io/async/AsyncRunners.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/io/async/AsyncRunners.scala
index 29f8a4debcf..377ee3997de 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/io/async/AsyncRunners.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/io/async/AsyncRunners.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2025, NVIDIA CORPORATION.
+ * Copyright (c) 2025-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -35,7 +35,7 @@ sealed trait AsyncRunResource
 /**
  * HostResource represents host memory resource requirement for CPU-bound tasks.
  */
-case class HostResource(hostMemoryBytes: Long) extends AsyncRunResource
+class HostResource(val hostMemoryBytes: Long) extends AsyncRunResource with Serializable
 
 /**
  * DeviceResource is a marker object for GPU resources, no additional fields needed.
@@ -44,7 +44,7 @@ object DeviceResource extends AsyncRunResource
 
 object AsyncRunResource {
   def newCpuResource(hostMemoryBytes: Long): AsyncRunResource = {
-    HostResource(hostMemoryBytes)
+    new HostResource(hostMemoryBytes)
   }
 
   def newGpuResource(): AsyncRunResource = DeviceResource
@@ -76,8 +76,6 @@ trait AsyncResult[T] extends AutoCloseable {
   }
 }
 
-case class AsyncMetrics(scheduleTimeMs: Long, executionTimeMs: Long)
-
 class AsyncMetricsBuilder {
   private var scheduleTimeMs: Long = 0L
   private var executionTimeMs: Long = 0L
@@ -93,7 +91,7 @@ class AsyncMetricsBuilder {
   }
 
   def build(): AsyncMetrics = {
-    AsyncMetrics(scheduleTimeMs, executionTimeMs)
+    new AsyncMetrics(scheduleTimeMs, executionTimeMs)
   }
 }
 
@@ -136,19 +134,19 @@ class DecayReleaseResult[T](override val data: T,
  */
 sealed trait AsyncRunnerState
 
-case class Init(firstTime: Boolean) extends AsyncRunnerState
+class Init(val firstTime: Boolean) extends AsyncRunnerState with Serializable
 
 case object Pending extends AsyncRunnerState
 
-case class ScheduleFailed(exception: Throwable) extends AsyncRunnerState
+class ScheduleFailed(val exception: Throwable) extends AsyncRunnerState with Serializable
 
 case object Running extends AsyncRunnerState
 
 case object Completed extends AsyncRunnerState
 
-case class ExecFailed(exception: Throwable) extends AsyncRunnerState
+class ExecFailed(val exception: Throwable) extends AsyncRunnerState with Serializable
 
-case class Closed(exception: Option[Throwable]) extends AsyncRunnerState
+class Closed(val exception: Option[Throwable]) extends AsyncRunnerState with Serializable
 
 case object Cancelled extends AsyncRunnerState
 
@@ -271,7 +269,7 @@ trait AsyncRunner[T] extends Callable[AsyncResult[T]] {
     }
   }
 
-  @volatile private var state: AsyncRunnerState = Init(firstTime = true)
+  @volatile private var state: AsyncRunnerState = new Init(firstTime = true)
 
   def isHoldingStateLock: Boolean = stateLock.isHeldByCurrentThread
 
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/io/async/ResourceBoundedThreadExecutor.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/io/async/ResourceBoundedThreadExecutor.scala
index eee1eaceb4c..48b0994b9b7 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/io/async/ResourceBoundedThreadExecutor.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/io/async/ResourceBoundedThreadExecutor.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2025, NVIDIA CORPORATION.
+ * Copyright (c) 2025-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -21,7 +21,6 @@ import java.util.concurrent.{BlockingQueue, Callable, Future, FutureTask, Priori
 import com.google.common.util.concurrent.ThreadFactoryBuilder
 
 import org.apache.spark.TaskContext
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.rapids.execution.TrampolineUtil
 import org.apache.spark.util.TaskCompletionListener
 
@@ -37,7 +36,11 @@ import org.apache.spark.util.TaskCompletionListener
  * @tparam T the result type returned by the AsyncRunner
  */
 class RapidsFutureTask[T](val runner: AsyncRunner[T])
-    extends FutureTask[AsyncResult[T]](runner) with Logging {
+    extends FutureTask[AsyncResult[T]](runner) {
+
+  private val log = org.slf4j.LoggerFactory.getLogger(classOf[RapidsFutureTask[_]])
+
+  private def logWarning(msg: => String): Unit = if (log.isWarnEnabled) log.warn(msg)
 
   override def run(): Unit = runner.withStateLock { rr =>
     rr.getState match {
@@ -61,14 +64,14 @@ class RapidsFutureTask[T](val runner: AsyncRunner[T])
         } else {
           // Failed due to unexpected exceptions
           val ex = new IllegalStateException("runner failed unexpectedly")
-          rr.setState(ExecFailed(ex))
+          rr.setState(new ExecFailed(ex))
         }
 
       // Throw the ScheduleFailed exception within the scope of `FutureTask.run`, so that
       // the exception can be properly recorded and propagated to the caller of `get()`.
-      case ScheduleFailed(ex: Throwable) =>
+      case failed: ScheduleFailed =>
         // Trick: register a pre-hook to let `AsyncRunner.call` throw the exception
-        rr.addPreHook(() => throw ex)
+        rr.addPreHook(() => throw failed.exception)
         super.run()
 
       // Handle the cancelled case as a special kind of ScheduleFailed
@@ -86,7 +89,7 @@ class RapidsFutureTask[T](val runner: AsyncRunner[T])
   }
 
   override def setException(e: Throwable): Unit = {
-    runner.setState(ExecFailed(e))
+    runner.setState(new ExecFailed(e))
     super.setException(e)
   }
 
@@ -144,7 +147,21 @@ class ResourceBoundedThreadExecutor(mgr: ResourcePool,
     workQueue: BlockingQueue[Runnable],
     threadFactory: ThreadFactory,
     keepAliveTime: Long = 100L) extends ThreadPoolExecutor(corePoolSize,
-  maximumPoolSize, keepAliveTime, TimeUnit.SECONDS, workQueue, threadFactory) with Logging {
+  maximumPoolSize, keepAliveTime, TimeUnit.SECONDS, workQueue, threadFactory) {
+
+  private val log = org.slf4j.LoggerFactory.getLogger(classOf[ResourceBoundedThreadExecutor])
+
+  private def logInfo(msg: => String): Unit = if (log.isInfoEnabled) log.info(msg)
+
+  private def logWarning(msg: => String): Unit = if (log.isWarnEnabled) log.warn(msg)
+
+  private def logDebug(msg: => String): Unit = if (log.isDebugEnabled) log.debug(msg)
+
+  private def logError(msg: => String): Unit = if (log.isErrorEnabled) log.error(msg)
+
+  private def logError(msg: => String, throwable: Throwable): Unit = {
+    if (log.isErrorEnabled) log.error(msg, throwable)
+  }
 
   logInfo(s"Creating ResourceBoundedThreadExecutor with resourcePool: ${mgr.toString}, " +
       s"corePoolSize: $corePoolSize, maximumPoolSize: $maximumPoolSize, " +
@@ -209,7 +226,7 @@ class ResourceBoundedThreadExecutor(mgr: ResourcePool,
       rr.getState match {
         // Cancelled case: Cancelled -> ScheduleFailed
         case Cancelled =>
-          rr.setState(ScheduleFailed(new IllegalStateException("cancelled")))
+          rr.setState(new ScheduleFailed(new IllegalStateException("cancelled")))
           logWarning(s"Runner being cancelled ahead of execution: $rr")
 
         // The main path: Init -> Pending -> Running | Pending | ScheduleFailed
@@ -229,9 +246,9 @@ class ResourceBoundedThreadExecutor(mgr: ResourcePool,
               rr.setState(Running)
               futTask.scheduleTime += s.elapsedTime
             // Fail the scheduling: Pending -> ScheduleFailed
-            case AcquireExcepted(ex) =>
-              rr.setState(ScheduleFailed(ex))
-              logError(s"$ex [$rr]")
+            case excepted: AcquireExcepted =>
+              rr.setState(new ScheduleFailed(excepted.exception))
+              logError(s"${excepted.exception} [$rr]")
             // Bypass the execution: Pending -> Pending
             case AcquireFailed =>
           }
@@ -241,7 +258,7 @@ class ResourceBoundedThreadExecutor(mgr: ResourcePool,
           // If we throw an exception here, it will crash the ThreadWorker without signaling
           // the caller. So we just mark the state as ScheduleFailed to pass the exception to
           // the caller via FutureTask.get().
-          rr.setState(ScheduleFailed(new IllegalStateException("Unexpected state")))
+          rr.setState(new ScheduleFailed(new IllegalStateException("Unexpected state")))
           logError(s"Unexpected state before schedule: $rr")
       }
     }
@@ -255,7 +272,7 @@ class ResourceBoundedThreadExecutor(mgr: ResourcePool,
       // and recorded the exception internally.
       if (t != null) {
         if (!rr.getState.isInstanceOf[ExecFailed]) {
-          rr.setState(ExecFailed(t))
+          rr.setState(new ExecFailed(t))
         }
         // Also try to fail the Spark task which launched this runner.
         rr.sparkTaskContext.foreach { ctx =>
@@ -268,7 +285,7 @@ class ResourceBoundedThreadExecutor(mgr: ResourcePool,
       // Post execution state handling
       rr.getState match {
         case Cancelled | // very rare case: cancelled between execution and afterExecute
-             ExecFailed(_) => // failed execution (ScheduleFailed should be cast to ExecFailed)
+             _: ExecFailed => // failed execution (ScheduleFailed should be cast to ExecFailed)
           // release holding resource immediately on exception
           if (rr.isHoldingResource) {
             rr.releaseResourceCallback()
@@ -290,7 +307,7 @@ class ResourceBoundedThreadExecutor(mgr: ResourcePool,
           require(!rr.isHoldingResource, s"Pending state should NOT hold Resource: $rr")
           // Requeue runners which failed to acquire resource and bypassed the execution.
           futTask.scheduleTime += timeoutMs * 1000000L
-          rr.setState(Init(firstTime = false)) // reset to Init state for re-scheduling
+          rr.setState(new Init(firstTime = false)) // reset to Init state for re-scheduling
           // Re-add the task to the work queue for re-execution
           if (!workQueue.add(futTask)) {
             // Fatal error
@@ -334,11 +351,11 @@ class ResourceBoundedThreadExecutor(mgr: ResourcePool,
           // Finalize the runner state
           state match {
             case Completed => // Completed -> Closed
-              rr.setState(Closed(None))
-            case ExecFailed(ex) => // ExecFailed -> Closed
-              rr.setState(Closed(Some(ex)))
+              rr.setState(new Closed(None))
+            case failed: ExecFailed => // ExecFailed -> Closed
+              rr.setState(new Closed(Some(failed.exception)))
             case Cancelled => // Cancelled -> Closed
-              rr.setState(Closed(Some(new IllegalStateException("cancelled"))))
+              rr.setState(new Closed(Some(new IllegalStateException("cancelled"))))
             case _ =>
               throw new IllegalStateException(s"Should NOT reach here: $rr")
           }
@@ -364,12 +381,12 @@ class ResourceBoundedThreadExecutor(mgr: ResourcePool,
           // 2. Mark the runner as Cancelled
           fut.runner.withStateLock { rr =>
             rr.getState match {
-              case Init(_) => rr.setState(Cancelled) // Init -> Cancelled
+              case _: Init => rr.setState(Cancelled) // Init -> Cancelled
               case Pending => rr.setState(Cancelled) // Pending -> Cancelled
               case Running => rr.setState(Cancelled) // Running -> Cancelled
-              case ScheduleFailed(_) => rr.setState(Cancelled) // ScheduleFailed -> Cancelled
+              case _: ScheduleFailed => rr.setState(Cancelled) // ScheduleFailed -> Cancelled
               case Completed => rr.setState(Cancelled) // Completed -> Cancelled
-              case Cancelled | ExecFailed(_) | Closed(_) => // do nothing
+              case Cancelled | _: ExecFailed | _: Closed => // do nothing
             }
           }
           // 3. If the runner is still holding resource, we release it
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/io/async/ResourcePools.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/io/async/ResourcePools.scala
index 5023d53f551..efa195183a6 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/io/async/ResourcePools.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/io/async/ResourcePools.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2025, NVIDIA CORPORATION.
+ * Copyright (c) 2025-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -22,7 +22,6 @@ import java.util.concurrent.locks.ReentrantLock
 
 import scala.collection.mutable
 
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.rapids.execution.TrampolineUtil.bytesToString
 
 // Being thrown when a task requests resources that are not valid or exceed the limits
@@ -32,13 +31,13 @@ class InvalidResourceRequest(msg: String) extends RuntimeException(
 // Represents the status of acquiring resources for a task
 sealed trait AcquireStatus
 
-case class AcquireSuccessful(elapsedTime: Long) extends AcquireStatus
+class AcquireSuccessful(val elapsedTime: Long) extends AcquireStatus with Serializable
 
 // AcquireFailed indicates that the task could not be scheduled due to resource constraints
 case object AcquireFailed extends AcquireStatus
 
 // AcquireExcepted indicates that an exception occurred while trying to acquire resources
-case class AcquireExcepted(exception: Throwable) extends AcquireStatus
+class AcquireExcepted(val exception: Throwable) extends AcquireStatus with Serializable
 
 /**
  * ResourceManager interface to be implemented for AsyncRunners requiring different kinds of
@@ -68,7 +67,13 @@ trait ResourcePool {
  * The implementation uses condition variables to efficiently block and wake up waiting
  * tasks when resources become available through task completion and resource release.
  */
-class HostMemoryPool(val maxHostMemoryBytes: Long) extends ResourcePool with Logging {
+class HostMemoryPool(val maxHostMemoryBytes: Long) extends ResourcePool {
+
+  private val log = org.slf4j.LoggerFactory.getLogger(classOf[HostMemoryPool])
+
+  private def logWarning(msg: => String): Unit = if (log.isWarnEnabled) log.warn(msg)
+
+  private def logDebug(msg: => String): Unit = if (log.isDebugEnabled) log.debug(msg)
 
   private val lock = new ReentrantLock()
 
@@ -94,7 +99,7 @@ class HostMemoryPool(val maxHostMemoryBytes: Long) extends ResourcePool with Log
     // step 2: try to acquire the resource with blocking and timeout
     // 2.1 If no resource needed, acquire immediately
     if (memoryRequire == 0L) {
-      AcquireSuccessful(elapsedTime = 0L)
+      new AcquireSuccessful(elapsedTime = 0L)
     }
     // 2.2 The main path for acquiring resource with blocking and timeout
     else {
@@ -160,10 +165,10 @@ class HostMemoryPool(val maxHostMemoryBytes: Long) extends ResourcePool with Log
               s"Over-committed HostMemoryPool: exceeded_amount=${bytesToString(-remaining)}, " +
                   s"AsyncRunners=$numRunnerInPool, SparkTasks=${tasksInPool.size}")
           }
-          AcquireSuccessful(elapsedTime = timeoutNs - waitTimeNs)
+          new AcquireSuccessful(elapsedTime = timeoutNs - waitTimeNs)
         }
       } catch {
-        case ex: Throwable => AcquireExcepted(ex)
+        case ex: Throwable => new AcquireExcepted(ex)
       } finally {
         lock.unlock()
       }
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/io/async/ThrottlingExecutor.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/io/async/ThrottlingExecutor.scala
index 2c799f1cd39..54460afd9bb 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/io/async/ThrottlingExecutor.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/io/async/ThrottlingExecutor.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2024-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2024-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -21,15 +21,6 @@ import java.util.concurrent.{Callable, ExecutorService, Future, TimeUnit}
 import org.apache.spark.sql.rapids.{ColumnarWriteTaskStatsTracker, GpuWriteTaskStatsTracker}
 
 
-/**
- * Stats related classes used by ThrottlingExecutor
- */
-case class ThrottlingExecutorStats (
-    var numTasksScheduled: Int,
-    var accumulatedThrottleTimeNs: Long,
-    var minThrottleTimeNs: Long,
-    var maxThrottleTimeNs: Long)
-
 /**
  * Only for GpuWriteTaskStatsTracker cases
  */
@@ -53,7 +44,7 @@ class StatsUpdaterForWriteFunc(val statsTrackers: Seq[ColumnarWriteTaskStatsTrac
 class ThrottlingExecutor(executor: ExecutorService, throttler: TrafficController,
     updateStats : ThrottlingExecutorStats => Unit) {
 
-  val stats: ThrottlingExecutorStats = ThrottlingExecutorStats(0, 0L, Long.MaxValue, 0L)
+  val stats: ThrottlingExecutorStats = new ThrottlingExecutorStats(0, 0L, Long.MaxValue, 0L)
 
   private def blockUntilTaskRunnable(task: Task[_]): Unit = {
     val blockStart = System.nanoTime()
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/limit.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/limit.scala
index dd8e4f3adda..2ffb973cd63 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/limit.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/limit.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2020-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2020-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -453,7 +453,7 @@ case class GpuTopN(
   }
 }
 
-case class GpuTakeOrderedAndProjectExecMeta(
+class GpuTakeOrderedAndProjectExecMeta(
    takeExec: TakeOrderedAndProjectExec,
    rapidsConf: RapidsConf,
    parentOpt: Option[RapidsMeta[_, _, _]],
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/literals.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/literals.scala
index fc6566dc222..0546bb5d36c 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/literals.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/literals.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2019-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2019-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -29,28 +29,26 @@ import ai.rapids.cudf.{ColumnVector, DType, HostColumnVector, Scalar}
 import ai.rapids.cudf.ast
 import com.nvidia.spark.rapids.Arm.withResource
 import com.nvidia.spark.rapids.RapidsPluginImplicits.AutoCloseableProducingArray
-import com.nvidia.spark.rapids.shims.{GpuTypeShims, SparkShimImpl}
+import com.nvidia.spark.rapids.shims.{GpuLiteralShim, GpuTypeShims, SparkShimImpl}
 import org.apache.commons.codec.binary.{Hex => ApacheHex}
-import org.json4s.JsonAST.{JField, JNull, JString}
 
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.catalyst.InternalRow
 import org.apache.spark.sql.catalyst.expressions.{Literal, UnsafeArrayData}
 import org.apache.spark.sql.catalyst.util.{ArrayData, DateTimeUtils, MapData, TimestampFormatter}
 import org.apache.spark.sql.internal.SQLConf
-import org.apache.spark.sql.rapids.execution.TrampolineUtil
 import org.apache.spark.sql.types._
 import org.apache.spark.sql.vectorized.ColumnarBatch
 import org.apache.spark.unsafe.types.UTF8String
 
 
 
-object GpuScalar extends Logging {
+object GpuScalar {
+  private[this] val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
 
   // TODO Support interpreting the value to a Spark DataType
   def extract(v: Scalar): Any = {
     if (v != null && v.isValid) {
-      logDebug(s"Extracting data from the Scalar $v.")
+      if (log.isDebugEnabled) log.debug(s"Extracting data from the Scalar $v.")
       v.getType match {
         case DType.BOOL8 => v.getBoolean
         case DType.FLOAT32 => v.getFloat
@@ -643,7 +641,7 @@ object GpuLiteral {
 /**
  * In order to do type conversion and checking, use GpuLiteral.create() instead of constructor.
  */
-case class GpuLiteral (value: Any, dataType: DataType) extends GpuLeafExpression {
+case class GpuLiteral (value: Any, dataType: DataType) extends GpuLiteralShim {
 
   // Assume this came from Spark Literal and no need to call Literal.validateLiteralValue here.
 
@@ -676,18 +674,6 @@ case class GpuLiteral (value: Any, dataType: DataType) extends GpuLeafExpression
     case _ => false
   }
 
-  override protected def jsonFields: List[JField] = {
-    // Turns all kinds of literal values to string in json field, as the type info is hard to
-    // retain in json format, e.g. {"a": 123} can be an int, or double, or decimal, etc.
-    val jsonValue = (value, dataType) match {
-      case (null, _) => JNull
-      case (i: Int, DateType) => JString(DateTimeUtils.toJavaDate(i).toString)
-      case (l: Long, TimestampType) => JString(DateTimeUtils.toJavaTimestamp(l).toString)
-      case (other, _) => JString(other.toString)
-    }
-    ("value" -> jsonValue) :: ("dataType" -> TrampolineUtil.jsonValue(dataType)) :: Nil
-  }
-
   override def sql: String = (value, dataType) match {
     case (_, NullType | _: ArrayType | _: MapType | _: StructType) if value == null => "NULL"
     case _ if value == null => s"CAST(NULL AS ${dataType.sql})"
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/lore/GpuLore.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/lore/GpuLore.scala
index fb9e042900c..3aa4d586021 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/lore/GpuLore.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/lore/GpuLore.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2024-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2024-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -31,7 +31,6 @@ import org.apache.hadoop.fs.Path
 
 import org.apache.spark.SparkEnv
 import org.apache.spark.broadcast.Broadcast
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.SparkSession
 import org.apache.spark.sql.catalyst.expressions.Attribute
 import org.apache.spark.sql.catalyst.trees.TreeNodeTag
@@ -42,9 +41,14 @@ import org.apache.spark.sql.rapids.shims.SparkSessionUtils
 import org.apache.spark.sql.types.DataType
 import org.apache.spark.util.SerializableConfiguration
 
-case class LoreRDDMeta(numPartitions: Int, outputPartitions: Seq[Int], attrs: Seq[Attribute])
+class LoreRDDMeta(
+    val numPartitions: Int,
+    val outputPartitions: Seq[Int],
+    val attrs: Seq[Attribute]) extends Serializable
 
-case class LoreRDDPartitionMeta(numBatches: Int, dataType: Seq[DataType])
+class LoreRDDPartitionMeta(
+    val numBatches: Int,
+    val dataType: Seq[DataType]) extends Serializable
 
 trait GpuLoreRDD {
   def rootPath: Path
@@ -64,7 +68,17 @@ trait GpuLoreRDD {
   }
 }
 
-object GpuLore extends Logging {
+object GpuLore {
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+
+  private def logWarning(msg: => String): Unit = {
+    if (log.isWarnEnabled) log.warn(msg) // msg is by-name: only built when WARN is on
+  }
+
+  private def logWarning(msg: => String, throwable: Throwable): Unit = {
+    if (log.isWarnEnabled) log.warn(msg, throwable) // by-name msg stays unevaluated otherwise
+  }
+
   /**
    * Lore id of a plan node.
    */
@@ -262,12 +276,13 @@ object GpuLore extends Logging {
                 checkUnsupportedOperator(g)
                 val currentExecRootPath = new Path(loreOutputRootPath, s"loreId-$loreId")
                 registerTag(g, LORE_DUMP_PATH_TAG, currentExecRootPath.toString, tagRollbacks)
-                val loreOutputInfo = LoreOutputInfo(outputLoreIds,
+                val loreOutputInfo = new LoreOutputInfo(outputLoreIds,
                   currentExecRootPath.toString)
 
                 g.children.zipWithIndex.foreach {
                   case (child, idx) =>
-                    val dumpRDDInfo = LoreDumpRDDInfo(idx, loreOutputInfo, child.output, hadoopConf,
+                    val dumpRDDInfo = new LoreDumpRDDInfo(idx, loreOutputInfo, child.output,
+                      hadoopConf,
                       useOriginalSchemaNames = rapidsConf.loreParquetUseOriginalNames,
                       nonStrictMode = allowNonStrictMode)
                     child match {
@@ -335,7 +350,7 @@ object GpuLore extends Logging {
       tagRollbacks: mutable.ArrayBuffer[TagRollback], nonStrictMode: Boolean) = {
     val innerPlan = sub.plan.child
     if (innerPlan.isInstanceOf[GpuExec]) {
-      val dumpRDDInfo = LoreDumpRDDInfo(id, loreOutputInfo, innerPlan.output,
+      val dumpRDDInfo = new LoreDumpRDDInfo(id, loreOutputInfo, innerPlan.output,
         hadoopConf,
         useOriginalSchemaNames = RapidsConf.LORE_PARQUET_USE_ORIGINAL_NAMES
           .get(SparkSessionUtils.sessionFromPlan(innerPlan).sessionState.conf),
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/lore/OutputLoreId.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/lore/OutputLoreId.scala
index 28fa0b2dbbf..b7f4fe37c94 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/lore/OutputLoreId.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/lore/OutputLoreId.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2024, NVIDIA CORPORATION.
+ * Copyright (c) 2024-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -25,7 +25,7 @@ case class OutputLoreId(loreId: LoreId, partitionIds: Set[Int]) {
     partitionIds.contains(partitionId)
 }
 
-case class LoreOutputInfo(outputLoreId: OutputLoreId, pathStr: String) {
+class LoreOutputInfo(val outputLoreId: OutputLoreId, val pathStr: String) extends Serializable {
   def path: Path = new Path(pathStr)
 }
 
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/lore/dump.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/lore/dump.scala
index 4c446cdd0cf..9ebdae964e8 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/lore/dump.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/lore/dump.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2024-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2024-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -27,7 +27,6 @@ import org.apache.hadoop.fs.Path
 
 import org.apache.spark.{Partition, SparkContext, TaskContext}
 import org.apache.spark.broadcast.Broadcast
-import org.apache.spark.internal.Logging
 import org.apache.spark.rdd.RDD
 import org.apache.spark.sql.catalyst.InternalRow
 import org.apache.spark.sql.catalyst.expressions.Attribute
@@ -37,16 +36,16 @@ import org.apache.spark.sql.vectorized.ColumnarBatch
 import org.apache.spark.util.SerializableConfiguration
 
 
-case class LoreDumpRDDInfo(
-    idxInParent: Int,
-    loreOutputInfo: LoreOutputInfo,
-    attrs: Seq[Attribute],
-    hadoopConf: Broadcast[SerializableConfiguration],
-    useOriginalSchemaNames: Boolean = false,
-    nonStrictMode: Boolean = false)
+class LoreDumpRDDInfo(
+    val idxInParent: Int,
+    val loreOutputInfo: LoreOutputInfo,
+    val attrs: Seq[Attribute],
+    val hadoopConf: Broadcast[SerializableConfiguration],
+    val useOriginalSchemaNames: Boolean,
+    val nonStrictMode: Boolean) extends Serializable
 
 class GpuLoreDumpRDD(info: LoreDumpRDDInfo, input: RDD[ColumnarBatch])
-  extends RDD[ColumnarBatch](input) with GpuLoreRDD with Logging {
+  extends RDD[ColumnarBatch](input) with GpuLoreRDD {
   override def rootPath: Path = pathOfChild(info.loreOutputInfo.path, info.idxInParent)
   private val factDataTypes = info.attrs.map(_.dataType)
   lazy val kudoSerializer: KudoSerializer = new KudoSerializer(
@@ -54,7 +53,8 @@ class GpuLoreDumpRDD(info: LoreDumpRDDInfo, input: RDD[ColumnarBatch])
 
   def saveMeta(): Unit = {
     try {
-      val meta = LoreRDDMeta(input.getNumPartitions, this.getPartitions.map(_.index), info.attrs)
+      val meta = new LoreRDDMeta(input.getNumPartitions, this.getPartitions.map(_.index),
+        info.attrs)
       GpuLore.dumpObject(meta, pathOfMeta, this.context.hadoopConfiguration)
     } catch {
       case NonFatal(e) if (info.nonStrictMode) =>
@@ -87,9 +87,9 @@ class GpuLoreDumpRDD(info: LoreDumpRDDInfo, input: RDD[ColumnarBatch])
                   .isInstanceOf[KudoSerializedTableColumn])
               val partitionMeta = if (isFromShuffle) {
                 // get the array of dataType from the info.attrs
-                LoreRDDPartitionMeta(batchIdx, factDataTypes)
+                new LoreRDDPartitionMeta(batchIdx, factDataTypes)
               } else {
-                LoreRDDPartitionMeta(batchIdx, GpuColumnVector.extractTypes(ret))
+                new LoreRDDPartitionMeta(batchIdx, GpuColumnVector.extractTypes(ret))
               }
               GpuLore.dumpObject(partitionMeta, pathOfPartitionMeta(split.index),
                 info.hadoopConf.value.value)
@@ -161,7 +161,7 @@ class SimpleRDD(_sc: SparkContext, data: Broadcast[Any], schema: StructType) ext
 case class GpuLoreDumpExec(
     child: GpuExec,
     loreDumpInfo: LoreDumpRDDInfo)
-    extends ShimUnaryExecNode with GpuExec with Logging {
+    extends ShimUnaryExecNode with GpuExec {
 
   override def output: Seq[Attribute] = child.output
 
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/lore/replay.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/lore/replay.scala
index 27fad8ef5e8..68dca621ffb 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/lore/replay.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/lore/replay.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2024-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2024-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -94,8 +94,8 @@ class GpuLoreReplayRDD(sc: SparkContext, rootPathStr: String,
   }
 
   override protected def getPartitions: Array[Partition] = {
-    (0 until loreRDDMeta.numPartitions).map(LoreReplayPartition).toArray
+    (0 until loreRDDMeta.numPartitions).map(new LoreReplayPartition(_)).toArray
   }
 }
 
-case class LoreReplayPartition(override val index: Int) extends Partition
+class LoreReplayPartition(override val index: Int) extends Partition
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/namedExpressions.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/namedExpressions.scala
index 249dae21c20..186d4f26c47 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/namedExpressions.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/namedExpressions.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2019-2023, NVIDIA CORPORATION.
+ * Copyright (c) 2019-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -21,12 +21,10 @@ import java.util.Objects
 import ai.rapids.cudf.ColumnVector
 import ai.rapids.cudf.ast
 import com.nvidia.spark.rapids.RapidsPluginImplicits._
-import com.nvidia.spark.rapids.shims.SparkShimImpl
 
 import org.apache.spark.sql.catalyst.analysis.UnresolvedAttribute
 import org.apache.spark.sql.catalyst.expressions.{Attribute, AttributeReference, Expression, ExprId, Generator, NamedExpression}
 import org.apache.spark.sql.catalyst.plans.logical.EventTimeWatermark
-import org.apache.spark.sql.catalyst.util.quoteIdentifier
 import org.apache.spark.sql.types.{DataType, Metadata}
 import org.apache.spark.sql.vectorized.ColumnarBatch
 
@@ -87,14 +85,9 @@ case class GpuAlias(child: Expression, name: String)(
   }
 
   override def sql: String = {
-    if (SparkShimImpl.hasAliasQuoteFix) {
-      val qualifierPrefix =
-        if (qualifier.nonEmpty) qualifier.map(quoteIfNeeded).mkString(".") + "." else ""
-      s"${child.sql} AS $qualifierPrefix${quoteIfNeeded(name)}"
-    } else {
-      val qualifierPrefix = if (qualifier.nonEmpty) qualifier.mkString(".") + "." else ""
-      s"${child.sql} AS $qualifierPrefix${quoteIdentifier(name)}"
-    }
+    val qualifierPrefix =
+      if (qualifier.nonEmpty) qualifier.map(quoteIfNeeded).mkString(".") + "." else ""
+    s"${child.sql} AS $qualifierPrefix${quoteIfNeeded(name)}"
   }
 
   private def quoteIfNeeded(part: String): String = {
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/nullExpressions.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/nullExpressions.scala
index d9fba601f02..862f798873c 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/nullExpressions.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/nullExpressions.scala
@@ -21,9 +21,9 @@ import scala.collection.mutable
 import ai.rapids.cudf.{ast, BinaryOp, ColumnVector, ColumnView, DType, Scalar}
 import com.nvidia.spark.rapids.Arm.withResource
 import com.nvidia.spark.rapids.RapidsPluginImplicits._
-import com.nvidia.spark.rapids.shims.ShimExpression
+import com.nvidia.spark.rapids.shims.{ShimExpression, ShimPredicate}
 
-import org.apache.spark.sql.catalyst.expressions.{ComplexTypeMergingExpression, Expression, Predicate}
+import org.apache.spark.sql.catalyst.expressions.{ComplexTypeMergingExpression, Expression}
 import org.apache.spark.sql.types.{DataType, DoubleType, FloatType}
 import org.apache.spark.sql.vectorized.ColumnarBatch
 
@@ -126,7 +126,7 @@ case class GpuCoalesce(children: Seq[Expression]) extends GpuExpression
  * UnaryOp
  */
 
-case class GpuIsNull(child: Expression) extends GpuUnaryExpression with Predicate {
+case class GpuIsNull(child: Expression) extends GpuUnaryExpression with ShimPredicate {
   override def nullable: Boolean = false
 
   override def sql: String = s"(${child.sql} IS NULL)"
@@ -140,7 +140,7 @@ case class GpuIsNull(child: Expression) extends GpuUnaryExpression with Predicat
   }
 }
 
-case class GpuIsNotNull(child: Expression) extends GpuUnaryExpression with Predicate {
+case class GpuIsNotNull(child: Expression) extends GpuUnaryExpression with ShimPredicate {
   override def nullable: Boolean = false
 
   override def sql: String = s"(${child.sql} IS NOT NULL)"
@@ -155,7 +155,7 @@ case class GpuIsNotNull(child: Expression) extends GpuUnaryExpression with Predi
   }
 }
 
-case class GpuIsNan(child: Expression) extends GpuUnaryExpression with Predicate {
+case class GpuIsNan(child: Expression) extends GpuUnaryExpression with ShimPredicate {
   override def nullable: Boolean = false
 
   override def sql: String = s"(${child.sql} IS NAN)"
@@ -192,7 +192,7 @@ case class GpuAtLeastNNonNulls(
     n: Int,
     exprs: Seq[Expression])
   extends GpuExpression with ShimExpression
-  with Predicate {
+  with ShimPredicate {
   override def nullable: Boolean = false
   override def foldable: Boolean = exprs.forall(_.foldable)
   override def toString: String = s"GpuAtLeastNNulls(n, ${children.mkString(",")})"
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/parquet/GpuParquetScan.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/parquet/GpuParquetScan.scala
index d0df36eebfc..95111d3944d 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/parquet/GpuParquetScan.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/parquet/GpuParquetScan.scala
@@ -18,7 +18,7 @@ package com.nvidia.spark.rapids.parquet
 
 import java.io.{Closeable, EOFException, FileNotFoundException, InputStream, IOException, OutputStream}
 import java.net.URI
-import java.nio.{ByteBuffer, ByteOrder}
+import java.nio.{Buffer, ByteBuffer, ByteOrder}
 import java.nio.channels.SeekableByteChannel
 import java.nio.charset.StandardCharsets
 import java.util.{Collections, Locale}
@@ -39,6 +39,7 @@ import com.nvidia.spark.rapids.RapidsPluginImplicits._
 import com.nvidia.spark.rapids.RmmRapidsRetryIterator.withRetryNoSplit
 import com.nvidia.spark.rapids.filecache.FileCache
 import com.nvidia.spark.rapids.fileio.hadoop.HadoopFileIO
+import com.nvidia.spark.rapids.fileio.hadoop.PerfIOHadoopInputFileFactory
 import com.nvidia.spark.rapids.io.async._
 import com.nvidia.spark.rapids.jni.{DateTimeRebase, ParquetFooter, RmmSpark}
 import com.nvidia.spark.rapids.jni.fileio.{RapidsFileIO, RapidsInputFile}
@@ -66,7 +67,6 @@ import org.xerial.snappy.Snappy
 
 import org.apache.spark.TaskContext
 import org.apache.spark.broadcast.Broadcast
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.SparkSession
 import org.apache.spark.sql.catalyst.InternalRow
 import org.apache.spark.sql.catalyst.expressions.Expression
@@ -117,7 +117,7 @@ case class GpuParquetScan(
     dataFilters: Seq[Expression],
     rapidsConf: RapidsConf,
     queryUsesInputFile: Boolean = false)
-  extends FileScan with GpuScan with Logging {
+  extends FileScan with GpuScan {
 
   override def isSplitable(path: Path): Boolean = true
 
@@ -428,14 +428,14 @@ class HMBSeekableInputStream(
     if (bytesRead < 0) {
       bytesRead
     } else {
-      buf.position(buf.position() + bytesRead)
+      buf.asInstanceOf[Buffer].position(buf.position() + bytesRead)
       bytesRead
     }
   }
 
   private def readFullyHeapBuffer(buf: ByteBuffer): Unit = {
     readFully(buf.array, buf.arrayOffset + buf.position(), buf.remaining)
-    buf.position(buf.limit)
+    buf.asInstanceOf[Buffer].position(buf.limit)
   }
 
   private def readDirectBuffer(buf: ByteBuffer): Int = {
@@ -492,7 +492,7 @@ class HMBInputFile(buffer: HostMemoryBuffer) extends InputFile {
 
 protected case class GpuParquetFileFilterHandler(
     @transient sqlConf: SQLConf,
-    metrics: Map[String, GpuMetric]) extends Logging {
+    metrics: Map[String, GpuMetric]) extends RapidsLocalLog {
 
   private val FOOTER_LENGTH_SIZE = 4
   private val isCaseSensitive = sqlConf.caseSensitiveAnalysis
@@ -1142,7 +1142,9 @@ abstract class AbstractGpuParquetMultiFilePartitionReaderFactory(
   // from a task when we need to create the fileIO instance. This stops a regression
   // when we materialize the hadoop conf eagerly, see:
   // https://github.com/NVIDIA/spark-rapids/issues/13353
-  @transient protected lazy val fileIO = new HadoopFileIO(broadcastedConf.value.value)
+  @transient protected lazy val fileIO = new HadoopFileIO(
+    broadcastedConf.value.value,
+    PerfIOHadoopInputFileFactory.INSTANCE)
   protected val isCaseSensitive = sqlConf.caseSensitiveAnalysis
   protected val debugDumpPrefix = rapidsConf.parquetDebugDumpPrefix
   protected val debugDumpAlways = rapidsConf.parquetDebugDumpAlways
@@ -1231,7 +1233,7 @@ abstract class AbstractGpuParquetMultiFilePartitionReaderFactory(
       filterHandler.filterBlocks(fileIO, footerReadType, file, new Configuration(conf),
         filters, readDataSchema)
     }
-    val combineConf = CombineConf(combineThresholdSize, combineWaitTime)
+    val combineConf = new CombineConf(combineThresholdSize, combineWaitTime)
     val poolConf = poolConfBuilder.build()
     val reader = createBaseMultiFileCloudReader(fileIO, conf, files, filterFunc,
       isCaseSensitive,
@@ -1292,7 +1294,7 @@ abstract class AbstractGpuParquetMultiFilePartitionReaderFactory(
       conf: Configuration,
       filters: Array[Filter],
       readDataSchema: StructType) extends UnboundedAsyncRunner[Array[BlockMetaWithPartFile]]
-      with Logging {
+      with RapidsLocalLog {
 
     override def callImpl(): Array[BlockMetaWithPartFile] = {
       TrampolineUtil.setTaskContext(taskContext)
@@ -1359,11 +1361,11 @@ abstract class AbstractGpuParquetMultiFilePartitionReaderFactory(
         metaAndFilesArr.foreach { metaAndFile =>
           val singleFileInfo = metaAndFile.meta
           clippedBlocks ++= singleFileInfo.blocks.map(block =>
-            ParquetSingleDataBlockMeta(
+            new ParquetSingleDataBlockMeta(
               singleFileInfo.filePath,
-              ParquetDataBlock(block, compressCfg),
+              new ParquetDataBlock(block, compressCfg),
               metaAndFile.file.partitionValues,
-              ParquetSchemaWrapper(singleFileInfo.schema),
+              new ParquetSchemaWrapper(singleFileInfo.schema),
               singleFileInfo.readSchema,
               new ParquetExtraInfo(singleFileInfo.dateRebaseMode,
                 singleFileInfo.timestampRebaseMode,
@@ -1474,7 +1476,9 @@ abstract class GpuParquetPartitionReaderFactoryBase(
   // from a task when we need to create the fileIO instance. This stops a regression
   // when we materialize the hadoop conf eagerly, see:
   // https://github.com/NVIDIA/spark-rapids/issues/13353
-  @transient protected lazy val fileIO = new HadoopFileIO(broadcastedConf.value.value)
+  @transient protected lazy val fileIO = new HadoopFileIO(
+    broadcastedConf.value.value,
+    PerfIOHadoopInputFileFactory.INSTANCE)
   protected val isCaseSensitive = sqlConf.caseSensitiveAnalysis
   protected val debugDumpPrefix = rapidsConf.parquetDebugDumpPrefix
   protected val debugDumpAlways = rapidsConf.parquetDebugDumpAlways
@@ -1524,7 +1528,7 @@ case class GpuParquetPartitionReaderFactory(
     @transient params: Map[String, String])
   extends GpuParquetPartitionReaderFactoryBase(
     sqlConf, broadcastedConf, dataSchema, readDataSchema, partitionSchema,
-    rapidsConf, metrics, params) with Logging {
+    rapidsConf, metrics, params) with RapidsLocalLog {
 
   override protected def buildBaseColumnarParquetReader(
       file: PartitionedFile): PartitionReader[ColumnarBatch] = {
@@ -1563,7 +1567,7 @@ object CpuCompressionConfig {
   def disabled(): CpuCompressionConfig = CpuCompressionConfig(false, false)
 }
 
-trait ParquetPartitionReaderBase extends Logging with ScanWithMetrics
+trait ParquetPartitionReaderBase extends RapidsLocalLog with ScanWithMetrics
     with MultiFileReaderFunctions {
   // the size of Parquet magic (at start+end) and footer length values
   val PARQUET_META_SIZE: Long = 4 + 4 + 4
@@ -2254,21 +2258,34 @@ trait ParquetPartitionReaderBase extends Logging with ScanWithMetrics
     block.asInstanceOf[ParquetDataBlock].dataBlock
 
   implicit def toDataBlockBase(blocks: Seq[BlockMetaData]): Seq[DataBlockBase] =
-    blocks.map(b => ParquetDataBlock(b, compressCfg))
+    blocks.map(b => new ParquetDataBlock(b, compressCfg))
 
   implicit def toBlockMetaDataSeq(blocks: Seq[DataBlockBase]): Seq[BlockMetaData] =
     blocks.map(_.asInstanceOf[ParquetDataBlock].dataBlock)
 }
 
 // Parquet schema wrapper
-case class ParquetSchemaWrapper(schema: MessageType) extends SchemaBase {
+class ParquetSchemaWrapper(val schema: MessageType) extends SchemaBase with Serializable {
   override def isEmpty: Boolean = schema.getFields.isEmpty
+
+  // Value equality on the wrapped schema, matching what the former case class
+  // provided; without it two wrappers of equal schemas compare by reference.
+  // NOTE(review): presumably relied on where reader code compares schemas of
+  // adjacent files/blocks before combining them -- confirm against callers.
+  override def equals(other: Any): Boolean = other match {
+    case that: ParquetSchemaWrapper => schema == that.schema
+    case _ => false
+  }
+
+  override def hashCode(): Int = java.util.Objects.hashCode(schema)
+
+  override def toString: String = s"ParquetSchemaWrapper($schema)"
 }
 
 // Parquet BlockMetaData wrapper
-case class ParquetDataBlock(
-    dataBlock: BlockMetaData,
-    compressCfg: CpuCompressionConfig) extends DataBlockBase {
+class ParquetDataBlock(
+    val dataBlock: BlockMetaData,
+    val compressCfg: CpuCompressionConfig) extends DataBlockBase with Serializable {
   override def getRowCount: Long = dataBlock.getRowCount
   override def getReadDataSize: Long = dataBlock.getTotalByteSize
   override def getBlockSize: Long = {
@@ -2282,13 +2286,13 @@ class ParquetExtraInfo(val dateRebaseMode: DateTimeRebaseMode,
     val hasInt96Timestamps: Boolean) extends ExtraInfo
 
 // contains meta about a single block in a file
-case class ParquetSingleDataBlockMeta(
-  filePath: Path,
-  dataBlock: ParquetDataBlock,
-  partitionValues: InternalRow,
-  schema: ParquetSchemaWrapper,
-  readSchema: StructType,
-  extraInfo: ParquetExtraInfo) extends SingleDataBlockInfo
+class ParquetSingleDataBlockMeta(
+  val filePath: Path,
+  val dataBlock: ParquetDataBlock,
+  val partitionValues: InternalRow,
+  val schema: ParquetSchemaWrapper,
+  val readSchema: StructType,
+  val extraInfo: ParquetExtraInfo) extends SingleDataBlockInfo with Serializable
 
 /**
  * Abstract base class for coalescing Parquet partition readers.
@@ -2676,8 +2680,8 @@ abstract class AbstractMultiFileCloudParquetPartitionReader(
       next.dateRebaseMode,
       current.timestampRebaseMode,
       next.timestampRebaseMode,
-      ParquetSchemaWrapper(current.clippedSchema),
-      ParquetSchemaWrapper(next.clippedSchema),
+      new ParquetSchemaWrapper(current.clippedSchema),
+      new ParquetSchemaWrapper(next.clippedSchema),
       current.partitionedFile.filePath.toString(),
       next.partitionedFile.filePath.toString()
     )
@@ -2916,7 +2920,7 @@ abstract class AbstractMultiFileCloudParquetPartitionReader(
   private class ReadBatchRunner(
       file: PartitionedFile,
       filterFunc: PartitionedFile => ParquetFileInfoWithBlockMeta,
-      taskContext: TaskContext) extends MemoryBoundedAsyncRunner[BufferInfo] with Logging {
+      taskContext: TaskContext) extends MemoryBoundedAsyncRunner[BufferInfo] with RapidsLocalLog {
 
     // Set TaskContext in terms of an AsyncRunner
     override def sparkTaskContext: Option[TaskContext] = Some(taskContext)
@@ -3325,7 +3329,15 @@ class MultiFileCloudParquetPartitionReader(
   }
 }
 
-object MakeParquetTableProducer extends Logging {
+object MakeParquetTableProducer {
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+
+  private def logWarning(msg: => String): Unit = {
+    if (log.isWarnEnabled) {
+      log.warn(msg)
+    }
+  }
+
   def apply(
       useChunkedReader: Boolean,
       maxChunkedReaderMemoryUsageSizeBytes: Long,
@@ -3406,7 +3418,7 @@ trait ChunkedReader extends AutoCloseable {
 /**
  * A simple wrapper to adapt the JniParquetChunkedReader to the ChunkedReader interface.
  */
-case class ParquetChunkedReader(delegate: JniParquetChunkedReader) extends ChunkedReader {
+class ParquetChunkedReader(val delegate: JniParquetChunkedReader) extends ChunkedReader {
   override def hasNext: Boolean = delegate.hasNext
   override def next: Table = delegate.readChunk()
   override def close(): Unit = delegate.close()
@@ -3427,7 +3439,7 @@ abstract class AbstractParquetTableReader(
     clippedParquetSchema: MessageType,
     splits: Array[PartitionedFile],
     debugDumpPrefix: Option[String],
-    debugDumpAlways: Boolean) extends GpuDataProducer[Table] with Logging {
+    debugDumpAlways: Boolean) extends GpuDataProducer[Table] with RapidsLocalLog {
 
   protected val reader: ChunkedReader
 
@@ -3500,7 +3512,7 @@ case class ParquetTableReader(
   opts, buffers, metrics, dateRebaseMode, timestampRebaseMode, isSchemaCaseSensitive, useFieldId,
   readDataSchema, clippedParquetSchema, splits, debugDumpPrefix, debugDumpAlways) {
 
-  override protected val reader: ChunkedReader = ParquetChunkedReader(
+  override protected val reader: ChunkedReader = new ParquetChunkedReader(
     new JniParquetChunkedReader(chunkSizeByteLimit, maxChunkedReaderMemoryUsageSizeBytes,
       opts, buffers:_*)
   )
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/parquet/GpuParquetUtils.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/parquet/GpuParquetUtils.scala
index cc9791a9038..52ab121978e 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/parquet/GpuParquetUtils.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/parquet/GpuParquetUtils.scala
@@ -24,9 +24,9 @@ import com.nvidia.spark.rapids.shims.parquet.GpuParquetUtilsShims
 import org.apache.parquet.hadoop.metadata.{BlockMetaData, ColumnChunkMetaData, ColumnPath}
 import org.apache.parquet.schema.MessageType
 
-import org.apache.spark.internal.Logging
 
-object GpuParquetUtils extends Logging {
+object GpuParquetUtils {
+
   /**
    * Trim block metadata to contain only the column chunks that occur in the specified schema.
    * The column chunks that are returned are preserved verbatim
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/parquet/ParquetCachedBatchSerializer.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/parquet/ParquetCachedBatchSerializer.scala
index 5ead8947dfb..d2cb5f4c863 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/parquet/ParquetCachedBatchSerializer.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/parquet/ParquetCachedBatchSerializer.scala
@@ -17,7 +17,7 @@
 package com.nvidia.spark.rapids.parquet
 
 import java.io.{InputStream, IOException}
-import java.nio.ByteBuffer
+import java.nio.{Buffer, ByteBuffer}
 
 import scala.collection.JavaConverters._
 import scala.collection.mutable
@@ -95,7 +95,7 @@ private class ByteBufferInputStream(private var buffer: ByteBuffer)
   override def skip(bytes: Long): Long = {
     if (buffer != null) {
       val amountToSkip = math.min(bytes, buffer.remaining).toInt
-      buffer.position(buffer.position() + amountToSkip)
+      buffer.asInstanceOf[Buffer].position(buffer.position() + amountToSkip)
       if (buffer.remaining() == 0) {
         cleanUp()
       }
@@ -128,7 +128,7 @@ class ByteArrayInputFile(buff: Array[Byte]) extends InputFile {
         if (newPos > Int.MaxValue || newPos < Int.MinValue) {
           throw new IllegalStateException("seek value is out of supported range " + newPos)
         }
-        byteBuffer.position(newPos.toInt)
+        byteBuffer.asInstanceOf[Buffer].position(newPos.toInt)
       }
     }
   }
@@ -231,7 +231,7 @@ case class ParquetCachedBatch(
  * Spark wants the producer to close the batch. We have a listener in this iterator that will close
  * the batch after the task is completed
  */
-private case class CloseableColumnBatchIterator(iter: Iterator[ColumnarBatch]) extends
+private class CloseableColumnBatchIterator(val iter: Iterator[ColumnarBatch]) extends
     Iterator[ColumnarBatch] {
   var cb: ColumnarBatch = _
 
@@ -592,7 +592,7 @@ class ParquetCachedBatchSerializer extends GpuCachedBatchSerializer {
           new ColumnarBatch(cols.safeMap(_.copyToHost()).toArray, gpuBatch.numRows())
         }
       })
-      cbRdd.mapPartitions(iter => CloseableColumnBatchIterator(iter))
+      cbRdd.mapPartitions(iter => new CloseableColumnBatchIterator(iter))
     } else {
       val origSelectedAttributesWithUnambiguousNames =
         sanitizeColumnNames(selectedAttributes, selectedSchemaWithNames)
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/profiler.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/profiler.scala
index de11a39bcd2..89cd76e5ac1 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/profiler.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/profiler.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2024-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2024-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -28,7 +28,6 @@ import org.apache.hadoop.fs.Path
 
 import org.apache.spark.{SparkContext, TaskContext}
 import org.apache.spark.api.plugin.PluginContext
-import org.apache.spark.internal.Logging
 import org.apache.spark.io.CompressionCodec
 import org.apache.spark.scheduler.{SparkListener, SparkListenerJobEnd, SparkListenerStageCompleted}
 import org.apache.spark.sql.rapids.execution.TrampolineUtil
@@ -38,7 +37,21 @@ import org.apache.spark.util.SerializableConfiguration
  * For profiling with com.nvidia.spark.rapids.jni.Profiler
  */
 
-object ProfilerOnExecutor extends Logging {
+object ProfilerOnExecutor {
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+
+  private def logInfo(msg: => String): Unit = if (log.isInfoEnabled) log.info(msg)
+
+  private def logWarning(msg: => String): Unit = if (log.isWarnEnabled) log.warn(msg)
+
+  private def logWarning(msg: => String, throwable: Throwable): Unit = {
+    if (log.isWarnEnabled) log.warn(msg, throwable)
+  }
+
+  private def logError(msg: => String, throwable: Throwable): Unit = {
+    if (log.isErrorEnabled) log.error(msg, throwable)
+  }
+
   private val jobPattern = raw"SPARK_.*_JId_([0-9]+).*".r
   private var writer: Option[ProfileWriter] = None
   private var timeRanges: Option[Seq[(Long, Long)]] = None
@@ -99,7 +112,7 @@ object ProfilerOnExecutor extends Logging {
         } catch {
           case l: Exception =>
             logWarning("Unable to launch profiler, we will abort profiling session.",l)
-            pluginCtx.send(ProfileErrorMsg(executorId, s"error launching profiler: $l"))
+            pluginCtx.send(new ProfileErrorMsg(executorId, s"error launching profiler: $l"))
             // failed to initialize, lets close the writer, and try to shutdown.
             if (profileWriter != null) {
               Profiler.shutdown()
@@ -188,7 +201,7 @@ object ProfilerOnExecutor extends Logging {
       if (!isProfileActive) {
         Profiler.start()
         isProfileActive = true
-        w.pluginCtx.send(ProfileStatusMsg(w.executorId, "profile started"))
+        w.pluginCtx.send(new ProfileStatusMsg(w.executorId, "profile started"))
       }
     }
   }
@@ -198,7 +211,7 @@ object ProfilerOnExecutor extends Logging {
       if (isProfileActive) {
         Profiler.stop()
         isProfileActive = false
-        w.pluginCtx.send(ProfileStatusMsg(w.executorId, "profile stopped"))
+        w.pluginCtx.send(new ProfileStatusMsg(w.executorId, "profile stopped"))
       }
     }
   }
@@ -290,7 +303,7 @@ object ProfilerOnExecutor extends Logging {
         (activeJobs.toArray, (activeStages ++ stageTaskCount.keys).toArray)
       }
       val (completedJobs, completedStages, allDone) =
-        w.pluginCtx.ask(ProfileJobStageQueryMsg(jobs, stages))
+        w.pluginCtx.ask(new ProfileJobStageQueryMsg(jobs, stages))
           .asInstanceOf[(Array[Int], Array[Int], Boolean)]
       synchronized {
         completedJobs.foreach(activeJobs.remove)
@@ -314,7 +327,11 @@ object ProfilerOnExecutor extends Logging {
 class ProfileWriter(
     val pluginCtx: PluginContext,
     profilePathPrefix: String,
-    codec: Option[CompressionCodec]) extends Profiler.DataWriter with Logging {
+    codec: Option[CompressionCodec]) extends Profiler.DataWriter {
+  @transient private lazy val log = org.slf4j.LoggerFactory.getLogger(classOf[ProfileWriter])
+
+  private def logWarning(msg: => String): Unit = if (log.isWarnEnabled) log.warn(msg)
+
   val executorId: String = pluginCtx.executorID()
   private val outPath = getOutputPath(profilePathPrefix, codec)
   private val out = openOutput(codec)
@@ -333,7 +350,7 @@ class ProfileWriter(
       isClosed = true
       out.close()
       logWarning(s"Profiling completed, output written to $outPath")
-      pluginCtx.send(ProfileEndMsg(executorId, outPath.toString))
+      pluginCtx.send(new ProfileEndMsg(executorId, outPath.toString))
     }
   }
 
@@ -355,7 +372,7 @@ class ProfileWriter(
 
   private def openOutput(codec: Option[CompressionCodec]): WritableByteChannel = {
     logWarning(s"Profiler initialized, output will be written to $outPath")
-    val hadoopConf = pluginCtx.ask(ProfileInitMsg(executorId, outPath.toString))
+    val hadoopConf = pluginCtx.ask(new ProfileInitMsg(executorId, outPath.toString))
       .asInstanceOf[SerializableConfiguration].value
     val fs = outPath.getFileSystem(hadoopConf)
     val fsStream = fs.create(outPath, false)
@@ -364,7 +381,15 @@ class ProfileWriter(
   }
 }
 
-object ProfilerOnDriver extends Logging {
+object ProfilerOnDriver {
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+
+  private def logWarning(msg: => String): Unit = if (log.isWarnEnabled) log.warn(msg)
+
+  private def logDebug(msg: => String): Unit = if (log.isDebugEnabled) log.debug(msg)
+
+  private def logError(msg: => String): Unit = if (log.isErrorEnabled) log.error(msg)
+
   private var hadoopConf: SerializableConfiguration = null
   private var jobRanges: RangeConfMatcher = null
   private var numJobsToProfile: Long = 0L
@@ -404,29 +429,35 @@ object ProfilerOnDriver extends Logging {
   }
 
   def handleMsg(m: ProfileMsg): AnyRef = m match {
-    case ProfileInitMsg(executorId, path) =>
+    case msg: ProfileInitMsg =>
+      val executorId = msg.executorId
+      val path = msg.path
       logWarning(s"Profiling: Executor $executorId initialized profiler, writing to $path")
       if (hadoopConf == null) {
         throw new IllegalStateException("Hadoop configuration not set")
       }
       hadoopConf
-    case ProfileErrorMsg(executorId, msg) =>
+    case msg: ProfileErrorMsg =>
+      val executorId = msg.executorId
+      val errorMsg = msg.msg
       if (profilerErrored) {
-        logDebug(s"Profiling: Error starting profiler from $executorId: $msg")
+        logDebug(s"Profiling: Error starting profiler from $executorId: $errorMsg")
       } else {
-        logError(s"Profiling: Error starting profiler from $executorId: $msg. Suppressing others.")
+        logError(s"Profiling: Error starting profiler from $executorId: $errorMsg. " +
+            "Suppressing others.")
       }
       profilerErrored = true
       null
-    case ProfileStatusMsg(executorId, msg) =>
-      logWarning(s"Profiling: Executor $executorId: $msg")
+    case msg: ProfileStatusMsg =>
+      logWarning(s"Profiling: Executor ${msg.executorId}: ${msg.msg}")
       null
-    case ProfileJobStageQueryMsg(activeJobs, activeStages) =>
-      val filteredJobs = activeJobs.filter(j => completedJobs.containsKey(j))
-      val filteredStages = activeStages.filter(s => completedStages.containsKey(s))
+    case msg: ProfileJobStageQueryMsg =>
+      val filteredJobs = msg.activeJobs.filter(j => completedJobs.containsKey(j))
+      val filteredStages = msg.activeStages.filter(s => completedStages.containsKey(s))
       (filteredJobs, filteredStages, isJobsStageProfilingComplete)
-    case ProfileEndMsg(executorId, path) =>
-      logWarning(s"Profiling: Executor $executorId ended profiling, profile written to $path")
+    case msg: ProfileEndMsg =>
+      logWarning(s"Profiling: Executor ${msg.executorId} ended profiling, " +
+          s"profile written to ${msg.path}")
       null
     case _ =>
       throw new IllegalStateException(s"Unexpected profile msg: $m")
@@ -453,17 +484,7 @@ object ProfilerOnDriver extends Logging {
   }
 }
 
-trait ProfileMsg
-
-case class ProfileInitMsg(executorId: String, path: String) extends ProfileMsg
-case class ProfileStatusMsg(executorId: String, msg: String) extends ProfileMsg
-case class ProfileErrorMsg(executorId: String, msg: String) extends ProfileMsg
-case class ProfileEndMsg(executorId: String, path: String) extends ProfileMsg
-
-// Reply is a tuple of:
+// Reply to ProfileJobStageQueryMsg is a tuple of:
 // - array of jobs that have completed
 // - array of stages that have completed
 // - boolean if there are no further jobs/stages to profile
-case class ProfileJobStageQueryMsg(
-    activeJobs: Array[Int],
-    activeStages: Array[Int]) extends ProfileMsg
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/python/GpuPythonArguments.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/python/GpuPythonArguments.scala
index 10ecb3fbece..2f33689d784 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/python/GpuPythonArguments.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/python/GpuPythonArguments.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2025, NVIDIA CORPORATION.
+ * Copyright (c) 2025-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -27,11 +27,11 @@ import org.apache.spark.sql.types.DataType
  * @param argOffsets The offsets of the original arguments in "flattenedArgs"
  * @param argNames The optional argument names
  */
-case class GpuPythonArguments(
-    flattenedArgs: Seq[Expression],
-    flattenedTypes: Seq[DataType],
-    argOffsets: Array[Array[Int]],
-    argNames: Option[Array[Array[Option[String]]]])
+class GpuPythonArguments(
+    val flattenedArgs: Seq[Expression],
+    val flattenedTypes: Seq[DataType],
+    val argOffsets: Array[Array[Int]],
+    val argNames: Option[Array[Array[Option[String]]]])
 
 /** Gpu version of ArgumentMetadata */
-case class GpuArgumentMeta(offset: Int, name: Option[String])
+class GpuArgumentMeta(val offset: Int, val name: Option[String])
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/python/PythonWorkerSemaphore.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/python/PythonWorkerSemaphore.scala
index 521b3340154..844f5453d60 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/python/PythonWorkerSemaphore.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/python/PythonWorkerSemaphore.scala
@@ -26,7 +26,6 @@ import com.nvidia.spark.rapids.python.PythonConfEntries.CONCURRENT_PYTHON_WORKER
 import org.apache.commons.lang3.mutable.MutableInt
 
 import org.apache.spark.{SparkEnv, TaskContext}
-import org.apache.spark.internal.Logging
 
 /*
  * PythonWorkerSemaphore is used to limit the number of Python workers(processes) to be started
@@ -41,7 +40,15 @@ import org.apache.spark.internal.Logging
  * the inner semaphore when no longer needed.
  *
  */
-object PythonWorkerSemaphore extends Logging {
+object PythonWorkerSemaphore {
+  private val log = org.slf4j.LoggerFactory.getLogger(
+    "com.nvidia.spark.rapids.python.PythonWorkerSemaphore")
+
+  private def logDebug(msg: => String): Unit = {
+    if (log.isDebugEnabled) {
+      log.debug(msg)
+    }
+  }
 
   private lazy val rapidsConf = new RapidsConf(SparkEnv.get.conf)
   private lazy val workersPerGpu = rapidsConf.get(CONCURRENT_PYTHON_WORKERS)
@@ -97,7 +104,15 @@ object PythonWorkerSemaphore extends Logging {
   }
 }
 
-private final class PythonWorkerSemaphore(tasksPerGpu: Int) extends Logging {
+private final class PythonWorkerSemaphore(tasksPerGpu: Int) {
+  private val log = org.slf4j.LoggerFactory.getLogger(classOf[PythonWorkerSemaphore])
+
+  private def logDebug(msg: => String): Unit = {
+    if (log.isDebugEnabled) {
+      log.debug(msg)
+    }
+  }
+
   private val semaphore = new Semaphore(tasksPerGpu)
   // Map to track which tasks have acquired the semaphore.
   private val activeTasks = new ConcurrentHashMap[Long, MutableInt]
diff --git a/sql-plugin/src/main/spark411/scala/com/nvidia/spark/rapids/shims/BloomFilterConstantsShims.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/BloomFilterConstantsShims.scala
similarity index 82%
rename from sql-plugin/src/main/spark411/scala/com/nvidia/spark/rapids/shims/BloomFilterConstantsShims.scala
rename to sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/BloomFilterConstantsShims.scala
index c45dd68118b..664d6a82c38 100644
--- a/sql-plugin/src/main/spark411/scala/com/nvidia/spark/rapids/shims/BloomFilterConstantsShims.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/BloomFilterConstantsShims.scala
@@ -14,11 +14,17 @@
  * limitations under the License.
  */
 
-/*** spark-rapids-shim-json-lines
-{"spark": "411"}
-spark-rapids-shim-json-lines ***/
 package com.nvidia.spark.rapids.shims
 
+import com.nvidia.spark.rapids.VersionUtils
+
 object BloomFilterConstantsShims {
-  val BLOOM_FILTER_FORMAT_VERSION: Int = 2
+  /**
+   * Bloom filter format version for the running Spark: 2 when
+   * `VersionUtils.cmpSparkVersion(4, 1, 0)` is non-negative, otherwise 1.
+   */
+  val BLOOM_FILTER_FORMAT_VERSION: Int = {
+    val atLeastSpark410 = VersionUtils.cmpSparkVersion(4, 1, 0) >= 0
+    if (atLeastSpark410) 2 else 1
+  }
 }
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/BloomFilterShims.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/BloomFilterShims.scala
index fe6306ec47e..ba9bb96af27 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/BloomFilterShims.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/BloomFilterShims.scala
@@ -41,14 +41,14 @@ object BloomFilterShims {
         }),
       GpuOverrides.expr[BloomFilterAggregate](
         "Bloom filter build",
-        ExprChecksImpl(Map(
+        new ExprChecksImpl(Map(
           (ReductionAggExprContext,
-            ContextChecks(TypeSig.BINARY, TypeSig.BINARY,
-              Seq(ParamCheck("child", TypeSig.LONG, TypeSig.LONG),
-                ParamCheck("estimatedItems",
+            new ContextChecks(TypeSig.BINARY, TypeSig.BINARY,
+              Seq(new ParamCheck("child", TypeSig.LONG, TypeSig.LONG),
+                new ParamCheck("estimatedItems",
                   TypeSig.lit(TypeEnum.LONG), TypeSig.lit(TypeEnum.LONG)),
-                ParamCheck("numBits",
-                  TypeSig.lit(TypeEnum.LONG), TypeSig.lit(TypeEnum.LONG))))))),
+                new ParamCheck("numBits",
+                  TypeSig.lit(TypeEnum.LONG), TypeSig.lit(TypeEnum.LONG))), None)))),
         (a, conf, p, r) => new TypedImperativeAggExprMeta[BloomFilterAggregate](a, conf, p, r) {
           private lazy val estimatedNumItems =
             GpuBloomFilterAggregate.clampEstimatedNumItems(
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/BucketingUtilsShim.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/BucketingUtilsShim.scala
index d1844867760..7d55a011dcf 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/BucketingUtilsShim.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/BucketingUtilsShim.scala
@@ -43,7 +43,7 @@ object BucketingUtilsShim {
         // table and a normal one.
         val bucketIdExpression = GpuHashPartitioning(bucketColumns, spec.numBuckets)
           .partitionIdExpression
-        GpuWriterBucketSpec(bucketIdExpression, (_: Int) => "")
+        new GpuWriterBucketSpec(bucketIdExpression, (_: Int) => "")
       }
     }
   }
diff --git a/sql-plugin/src/main/spark350db143/scala/com/nvidia/spark/rapids/shims/CastTimeToIntShim.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/CastTimeToIntShim.scala
similarity index 69%
rename from sql-plugin/src/main/spark350db143/scala/com/nvidia/spark/rapids/shims/CastTimeToIntShim.scala
rename to sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/CastTimeToIntShim.scala
index 5c529226fea..19c3d55cc6d 100644
--- a/sql-plugin/src/main/spark350db143/scala/com/nvidia/spark/rapids/shims/CastTimeToIntShim.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/CastTimeToIntShim.scala
@@ -13,18 +13,21 @@
  * See the License for the specific language governing permissions and
  * limitations under the License.
  */
-/*** spark-rapids-shim-json-lines
-{"spark": "350db143"}
-{"spark": "400"}
-{"spark": "400db173"}
-{"spark": "401"}
-{"spark": "402"}
-{"spark": "411"}
-spark-rapids-shim-json-lines ***/
+
 package com.nvidia.spark.rapids.shims
 
+import com.nvidia.spark.rapids.VersionUtils
+
 object CastTimeToIntShim {
-  // From 400, rows overflow will be set to nulls when casting timestamps to integrals,
+  // Whether to set overflow rows to nulls when casting timestamps to integrals,
   // when ANSI is disabled.
-  def ifNullifyOverflows: Boolean = true
+  // Enabled when cmpSparkVersion(4, 0, 0) >= 0, or on Databricks when
+  // cmpSparkVersion(3, 5, 0) == 0.
+  def ifNullifyOverflows: Boolean = {
+    if (VersionUtils.cmpSparkVersion(4, 0, 0) >= 0) {
+      true
+    } else {
+      VersionUtils.isDataBricks && VersionUtils.cmpSparkVersion(3, 5, 0) == 0
+    }
+  }
 }
diff --git a/sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/DayTimeIntervalShims.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/DayTimeIntervalShims.scala
similarity index 82%
rename from sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/DayTimeIntervalShims.scala
rename to sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/DayTimeIntervalShims.scala
index 94e0b85ab64..974999a48af 100644
--- a/sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/DayTimeIntervalShims.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/DayTimeIntervalShims.scala
@@ -14,34 +14,6 @@
  * limitations under the License.
  */
 
-/*** spark-rapids-shim-json-lines
-{"spark": "330"}
-{"spark": "330db"}
-{"spark": "331"}
-{"spark": "332"}
-{"spark": "332db"}
-{"spark": "333"}
-{"spark": "334"}
-{"spark": "340"}
-{"spark": "341"}
-{"spark": "341db"}
-{"spark": "342"}
-{"spark": "343"}
-{"spark": "344"}
-{"spark": "350"}
-{"spark": "350db143"}
-{"spark": "351"}
-{"spark": "352"}
-{"spark": "353"}
-{"spark": "354"}
-{"spark": "355"}
-{"spark": "356"}
-{"spark": "357"}
-{"spark": "358"}
-{"spark": "400"}
-{"spark": "401"}
-{"spark": "402"}
-spark-rapids-shim-json-lines ***/
 package com.nvidia.spark.rapids.shims
 
 import com.nvidia.spark.rapids._
@@ -52,9 +24,7 @@ import org.apache.spark.sql.rapids._
 import org.apache.spark.sql.rapids.shims.{GpuDivideDTInterval, GpuMultiplyDTInterval}
 
 object DayTimeIntervalShims {
-  def exprs: Map[Class[_ <: Expression], ExprRule[_ <: Expression]] = 
-    // TimeAdd moved to TimeAddShims to handle version differences
-    TimeAddShims.exprs ++ Seq(
+  def exprs: Map[Class[_ <: Expression], ExprRule[_ <: Expression]] = Seq(
     GpuOverrides.expr[Abs](
       "Absolute value",
       ExprChecks.unaryProjectAndAstInputMatchesOutput(
diff --git a/sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/DecimalMultiply128.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/DecimalMultiply128.scala
similarity index 59%
rename from sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/DecimalMultiply128.scala
rename to sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/DecimalMultiply128.scala
index 95bc2097f53..fc29946b71e 100644
--- a/sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/DecimalMultiply128.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/DecimalMultiply128.scala
@@ -14,32 +14,36 @@
  * limitations under the License.
  */
 
-/*** spark-rapids-shim-json-lines
-{"spark": "330"}
-{"spark": "330db"}
-{"spark": "331"}
-{"spark": "332"}
-{"spark": "332db"}
-{"spark": "333"}
-{"spark": "334"}
-{"spark": "340"}
-{"spark": "341"}
-{"spark": "341db"}
-{"spark": "350"}
-spark-rapids-shim-json-lines ***/
 package com.nvidia.spark.rapids.shims
 
 import ai.rapids.cudf.{ColumnView, Table}
+import com.nvidia.spark.rapids.VersionUtils
 import com.nvidia.spark.rapids.jni.DecimalUtils._
 
 object DecimalMultiply128 {
+  /**
+   * Decides which `multiply128` call `apply` makes for the running Spark version.
+   *
+   * The call that casts the interim result to precision 38 should only be used for
+   * versions of Spark before 3.4.2, 4.0.0, 3.5.1. This returns true for the remaining
+   * versions, and for Databricks builds that compare equal to 3.5.0.
+   */
+  private def useFinalPrecisionScaleMultiply: Boolean = {
+    // At or above 3.5.1 already includes every 4.x release, so no separate 4.0.0 test.
+    VersionUtils.cmpSparkVersion(3, 5, 1) >= 0 ||
+      (VersionUtils.cmpSparkVersion(3, 4, 2) >= 0 &&
+        VersionUtils.cmpSparkVersion(3, 5, 0) < 0) ||
+      (VersionUtils.isDataBricks && VersionUtils.cmpSparkVersion(3, 5, 0) == 0)
+  }
+
   def apply(castLhs: ColumnView, castRhs: ColumnView, scale: Int): Table = {
-    /**
-     * We are calling multiply128 that casts the interim result to a 38 precision before casting to
-     * the final precision and scale.
-     * This version of multiplying 128-bits should only be used for versions of Spark before 3.4.2,
-     * 4.0.0, 3.5.1
-     */
-    multiply128(castLhs, castRhs, scale)
+    if (useFinalPrecisionScaleMultiply) {
+      // NOTE(review): the trailing `false` presumably disables the interim cast -- confirm.
+      multiply128(castLhs, castRhs, scale, false)
+    } else {
+      // This overload casts the interim result to precision 38 before casting to the
+      // final precision and scale.
+      multiply128(castLhs, castRhs, scale)
+    }
   }
 }
diff --git a/sql-plugin/src/main/spark400/scala/com/nvidia/spark/rapids/shims/GetJsonObjectShim.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/GetJsonObjectShim.scala
similarity index 85%
rename from sql-plugin/src/main/spark400/scala/com/nvidia/spark/rapids/shims/GetJsonObjectShim.scala
rename to sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/GetJsonObjectShim.scala
index fa10aa6e489..7b087eecfa6 100644
--- a/sql-plugin/src/main/spark400/scala/com/nvidia/spark/rapids/shims/GetJsonObjectShim.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/GetJsonObjectShim.scala
@@ -14,15 +14,10 @@
  * limitations under the License.
  */
 
-/*** spark-rapids-shim-json-lines
-{"spark": "400"}
-{"spark": "400db173"}
-{"spark": "401"}
-{"spark": "402"}
-{"spark": "411"}
-spark-rapids-shim-json-lines ***/
 package com.nvidia.spark.rapids.shims
 
+import com.nvidia.spark.rapids.VersionUtils
+
 object GetJsonObjectShim {
   /**
    * Return a shim string for a part in named Regexp.
@@ -35,5 +30,11 @@ object GetJsonObjectShim {
    * "[^\\'\\?]+" : One or more chars which are not: ' or ?
    * "[^\\']+"    : One or more chars which are not: '
    */
-  def partRegexpInNamed: String = "[^\\']+"
+  def partRegexpInNamed: String = {
+    if (VersionUtils.cmpSparkVersion(4, 0, 0) >= 0) {
+      "[^\\']+"
+    } else {
+      "[^\\'\\?]+"
+    }
+  }
 }
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/GpuOrcDataReader320Plus.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/GpuOrcDataReader320Plus.scala
index fb4678f6cc6..eb162cace62 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/GpuOrcDataReader320Plus.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/GpuOrcDataReader320Plus.scala
@@ -16,7 +16,7 @@
 package com.nvidia.spark.rapids.shims
 
 import java.io.EOFException
-import java.nio.ByteBuffer
+import java.nio.{Buffer, ByteBuffer}
 import java.nio.channels.SeekableByteChannel
 
 import ai.rapids.cudf.HostMemoryBuffer
@@ -43,8 +43,8 @@ abstract class GpuOrcDataReader320Plus(
       val offset = current.getOffset
       while (current ne last.next) {
         val buffer = if (current eq last) data else data.duplicate()
-        buffer.position((current.getOffset - offset).toInt)
-        buffer.limit((current.getEnd - offset).toInt)
+        buffer.asInstanceOf[Buffer].position((current.getOffset - offset).toInt)
+        buffer.asInstanceOf[Buffer].limit((current.getEnd - offset).toInt)
         current.asInstanceOf[BufferChunk].setChunk(buffer)
         // see if the filecache wants any of this data
         val cacheToken = FileCache.get.startDataRangeCache(inputFile,
@@ -75,7 +75,7 @@ abstract class GpuOrcDataReader320Plus(
           throw new EOFException(s"Unexpected EOF while reading cached block for $filePathString")
         }
       }
-      buffer.flip()
+      buffer.asInstanceOf[Buffer].flip()
       chunk.asInstanceOf[BufferChunk].setChunk(buffer)
       chunk
     }
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/GpuOrcDataReaderBase.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/GpuOrcDataReaderBase.scala
index df62a38b241..32a25b7d775 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/GpuOrcDataReaderBase.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/GpuOrcDataReaderBase.scala
@@ -16,7 +16,7 @@
 package com.nvidia.spark.rapids.shims
 
 import java.io.{EOFException, IOException}
-import java.nio.ByteBuffer
+import java.nio.{Buffer, ByteBuffer}
 import java.nio.channels.SeekableByteChannel
 
 import ai.rapids.cudf.HostMemoryBuffer
@@ -24,6 +24,7 @@ import com.nvidia.spark.rapids.{GpuMetric, HostMemoryOutputStream, NoopMetric}
 import com.nvidia.spark.rapids.Arm.{closeOnExcept, withResource}
 import com.nvidia.spark.rapids.filecache.FileCache
 import com.nvidia.spark.rapids.fileio.hadoop.HadoopFileIO
+import com.nvidia.spark.rapids.fileio.hadoop.PerfIOHadoopInputFileFactory
 import com.nvidia.spark.rapids.jni.fileio.RapidsInputFile
 import org.apache.hadoop.conf.Configuration
 import org.apache.hadoop.fs.FSDataInputStream
@@ -37,7 +38,9 @@ abstract class GpuOrcDataReaderBase(
     metrics: Map[String, GpuMetric]) extends DataReader {
   protected val filePathString = props.getPath.toString
   protected var file: Option[FSDataInputStream] = None
-  protected lazy val fileIO = new HadoopFileIO(conf)
+  protected lazy val fileIO = new HadoopFileIO(
+    conf,
+    PerfIOHadoopInputFileFactory.INSTANCE)
   protected lazy val inputFile: RapidsInputFile = fileIO.newInputFile(filePathString)
   protected val compression = props.getCompression
   private val hitMetric = getMetric(GpuMetric.FILECACHE_DATA_RANGE_HITS)
@@ -116,7 +119,7 @@ abstract class GpuOrcDataReaderBase(
               throw new EOFException("Unexpected EOF while reading stripe footer")
             }
           }
-          tailBuf.flip()
+          tailBuf.asInstanceOf[Buffer].flip()
         }
       }
     } else {
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/ReplaceDataExecShim.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/ReplaceDataExecShim.scala
new file mode 100644
index 00000000000..94054ce4e3e
--- /dev/null
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/ReplaceDataExecShim.scala
@@ -0,0 +1,106 @@
+/*
+ * Copyright (c) 2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+package com.nvidia.spark.rapids.shims
+
+import java.lang.reflect.{InvocationTargetException, Method}
+
+import com.nvidia.spark.rapids.{GpuExec, GpuWrite}
+
+import org.apache.spark.sql.execution.SparkPlan
+
+/**
+ * Builds a `GpuReplaceDataExec` through reflection, so this file does not reference the
+ * CPU exec class or the GPU exec class at compile time.
+ */
+object ReplaceDataExecShim {
+  // Binary name of the Scala companion object, hence the trailing `$`.
+  private val gpuReplaceDataExecCompanion =
+    "org.apache.spark.sql.execution.datasources.v2.GpuReplaceDataExec$"
+
+  /**
+   * Reflectively calls `GpuReplaceDataExec.apply` with values read from `cpuExec`.
+   *
+   * @param cpuExec exec that must expose a public no-arg `refreshCache` method and may
+   *                expose a public no-arg `projections` method
+   * @param childPlan passed as the first `apply` argument
+   * @param gpuWrite passed as the last `apply` argument
+   * @return the value returned by `apply`, cast to `GpuExec`
+   */
+  def convertToGpu(
+      cpuExec: AnyRef,
+      childPlan: SparkPlan,
+      gpuWrite: GpuWrite): GpuExec = {
+    val refreshCache = invokeNoArg(cpuExec, "refreshCache")
+    val companion = Class.forName(gpuReplaceDataExecCompanion).getField("MODULE$").get(null)
+    // The arity of `apply` depends on whether the CPU exec has `projections`.
+    maybeInvokeNoArg(cpuExec, "projections") match {
+      case Some(projections) =>
+        invokeApply(companion, 4, childPlan, refreshCache, projections, gpuWrite)
+      case None =>
+        invokeApply(companion, 3, childPlan, refreshCache, gpuWrite)
+    }
+  }
+
+  /**
+   * Invokes the public no-arg method `methodName` when the target's class has one.
+   * Only the lookup is guarded: a `NoSuchMethodException` raised by the invoked method
+   * itself is propagated instead of being mistaken for a missing method.
+   */
+  private def maybeInvokeNoArg(target: AnyRef, methodName: String): Option[AnyRef] = {
+    val lookedUp = try {
+      Some(target.getClass.getMethod(methodName))
+    } catch {
+      case _: NoSuchMethodException => None
+    }
+    lookedUp.map(method => invoke(method, target))
+  }
+
+  /** Invokes the public no-arg method `methodName`; fails if it does not exist. */
+  private def invokeNoArg(target: AnyRef, methodName: String): AnyRef = {
+    invoke(target.getClass.getMethod(methodName), target)
+  }
+
+  /**
+   * Calls the first `apply` reported by `getMethods` on `companion` that takes
+   * `parameterCount` parameters. Matching is by arity only, not by parameter types.
+   */
+  private def invokeApply(
+      companion: AnyRef,
+      parameterCount: Int,
+      args: AnyRef*): GpuExec = {
+    val method = companion.getClass.getMethods.find { method =>
+      method.getName == "apply" && method.getParameterCount == parameterCount
+    }.getOrElse {
+      throw new NoSuchMethodException(
+        s"GpuReplaceDataExec.apply with $parameterCount parameters")
+    }
+    invoke(method, companion, args: _*).asInstanceOf[GpuExec]
+  }
+
+  /**
+   * Invokes `method`, rethrowing the underlying exception rather than the reflection
+   * wrapper. A wrapper without a cause is left as is, since `throw null` would surface
+   * as a `NullPointerException` and hide the real failure.
+   */
+  private def invoke(method: Method, target: AnyRef, args: AnyRef*): AnyRef = {
+    try {
+      method.invoke(target, args: _*)
+    } catch {
+      case e: InvocationTargetException if e.getCause != null =>
+        throw e.getCause
+    }
+  }
+}
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/Spark320PlusShims.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/Spark320PlusShims.scala
index d3d0a8fd88f..c8c71a3e553 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/Spark320PlusShims.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/Spark320PlusShims.scala
@@ -21,7 +21,6 @@ import scala.annotation.nowarn
 import com.nvidia.spark.rapids._
 import com.nvidia.spark.rapids.GpuOverrides.exec
 
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.catalyst.{InternalRow, TableIdentifier}
 import org.apache.spark.sql.catalyst.expressions._
 import org.apache.spark.sql.catalyst.expressions.aggregate.Average
@@ -51,7 +50,7 @@ import org.apache.spark.sql.rapids.shims.TrampolineConnectShims.SparkSession
  * Shim base class that can be compiled with every supported 3.2.0+
  */
 trait Spark320PlusShims extends SparkShims with RebaseShims
-    with WindowInPandasShims with Logging {
+    with WindowInPandasShims {
 
 
   override final def aqeShuffleReaderExec: ExecRule[_ <: SparkPlan] = exec[AQEShuffleReadExec](
@@ -136,7 +135,7 @@ trait Spark320PlusShims extends SparkShims with RebaseShims
         TypeSig.DOUBLE + TypeSig.DECIMAL_128,
         // NullType is not technically allowed by Spark, but in practice in 3.2.0
         // it can show up
-        Seq(ParamCheck("input",
+        Seq(new ParamCheck("input",
           TypeSig.integral + TypeSig.fp + TypeSig.DECIMAL_128 + TypeSig.NULL,
           TypeSig.numericAndInterval + TypeSig.NULL))),
       (a, conf, p, r) => new AggExprMeta[Average](a, conf, p, r) {
@@ -184,11 +183,11 @@ trait Spark320PlusShims extends SparkShims with RebaseShims
         TypeSig.CALENDAR + TypeSig.NULL + TypeSig.integral + TypeSig.DAYTIME,
         TypeSig.numericAndInterval,
         Seq(
-          ParamCheck("lower",
+          new ParamCheck("lower",
             TypeSig.CALENDAR + TypeSig.NULL + TypeSig.integral + TypeSig.DAYTIME
               + TypeSig.DECIMAL_128 + TypeSig.FLOAT + TypeSig.DOUBLE,
             TypeSig.numericAndInterval),
-          ParamCheck("upper",
+          new ParamCheck("upper",
             TypeSig.CALENDAR + TypeSig.NULL + TypeSig.integral + TypeSig.DAYTIME
               + TypeSig.DECIMAL_128 + TypeSig.FLOAT + TypeSig.DOUBLE,
             TypeSig.numericAndInterval))),
@@ -199,8 +198,8 @@ trait Spark320PlusShims extends SparkShims with RebaseShims
       ExprChecks.windowOnly(
         TypeSig.all,
         TypeSig.all,
-        Seq(ParamCheck("windowFunction", TypeSig.all, TypeSig.all),
-          ParamCheck("windowSpec",
+        Seq(new ParamCheck("windowFunction", TypeSig.all, TypeSig.all),
+          new ParamCheck("windowSpec",
             TypeSig.CALENDAR + TypeSig.NULL + TypeSig.integral + TypeSig.DECIMAL_64 +
               TypeSig.DAYTIME, TypeSig.numericAndInterval))),
       (windowExpression, conf, p, r) => new GpuWindowExpressionMeta(windowExpression, conf, p, r))
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/Spark321PlusShims.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/Spark321PlusShims.scala
index 777e1a5ccc6..fc7dc662e28 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/Spark321PlusShims.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/Spark321PlusShims.scala
@@ -18,14 +18,13 @@ package com.nvidia.spark.rapids.shims
 
 import org.apache.parquet.schema.MessageType
 
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.execution.datasources._
 import org.apache.spark.sql.execution.datasources.parquet.ParquetFilters
 
 /**
  * Shim base class that can be compiled with every supported 3.2.1+
  */
-trait Spark321PlusShims extends Spark320PlusShims with RebaseShims with Logging {
+trait Spark321PlusShims extends Spark320PlusShims with RebaseShims {
   override def getParquetFilters(
       schema: MessageType,
       pushDownDate: Boolean,
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/TryModeShim.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/TryModeShim.scala
new file mode 100644
index 00000000000..15b1891ae46
--- /dev/null
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/TryModeShim.scala
@@ -0,0 +1,67 @@
+/*
+ * Copyright (c) 2025-2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package com.nvidia.spark.rapids.shims
+
+import java.lang.reflect.InvocationTargetException
+
+import org.apache.spark.sql.catalyst.expressions.Expression
+
+/** Detects TRY evaluation mode reflectively, without naming the eval-mode type. */
+object TryModeShim {
+  private val TryModeName = "TRY"
+
+  /** Returns true when the eval mode found on `expr` has the string form "TRY". */
+  def isTryMode(expr: Expression): Boolean = {
+    evalMode(expr) match {
+      case Some(mode) => String.valueOf(mode) == TryModeName
+      case None => false
+    }
+  }
+
+  /**
+   * Reads a no-arg `evalMode` from the expression itself; when that yields nothing, reads
+   * it from the object returned by the expression's no-arg `evalContext`.
+   */
+  private def evalMode(expr: Expression): Option[AnyRef] = {
+    val direct = invokeNoArg(expr, "evalMode")
+    if (direct.isDefined) {
+      direct
+    } else {
+      for {
+        context <- invokeNoArg(expr, "evalContext")
+        mode <- invokeNoArg(context, "evalMode")
+      } yield mode
+    }
+  }
+
+  /**
+   * Calls the public no-arg method `methodName` on `target`. Yields None when the method
+   * is missing, inaccessible, or returns null; an exception thrown by the method itself
+   * is rethrown unwrapped.
+   */
+  private def invokeNoArg(target: AnyRef, methodName: String): Option[AnyRef] = {
+    try {
+      val result = target.getClass.getMethod(methodName).invoke(target)
+      Option(result.asInstanceOf[AnyRef])
+    } catch {
+      case _: NoSuchMethodException | _: IllegalAccessException =>
+        None
+      case wrapped: InvocationTargetException if wrapped.getCause != null =>
+        throw wrapped.getCause
+    }
+  }
+}
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/gpuWindows.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/gpuWindows.scala
index 3c324433183..6e2670098bf 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/gpuWindows.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/gpuWindows.scala
@@ -69,7 +69,7 @@ object GpuWindowUtil {
     case GpuLiteral(value, _: DayTimeIntervalType) =>
       var x = value.asInstanceOf[Long]
       if (x == Long.MinValue) x = Long.MaxValue
-      ParsedBoundary(isUnbounded = false, RangeBoundaryValue.long(Math.abs(x)))
+      new ParsedBoundary(isUnbounded = false, RangeBoundaryValue.long(Math.abs(x)))
     case anything => throw new UnsupportedOperationException("Unsupported window frame" +
       s" expression $anything")
   }
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/parquet/ParquetSchemaClipShims.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/parquet/ParquetSchemaClipShims.scala
index d91679a7ef4..87ccb7589b1 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/parquet/ParquetSchemaClipShims.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shims/parquet/ParquetSchemaClipShims.scala
@@ -107,7 +107,7 @@ object ParquetSchemaClipShims {
       val scale = decimalLogicalTypeAnnotation.getScale
 
       if (!(maxPrecision == -1 || 1 <= precision && precision <= maxPrecision)) {
-        throw new RapidsAnalysisException(s"Invalid decimal precision: $typeName " +
+        throw RapidsAnalysisException(s"Invalid decimal precision: $typeName " +
             s"cannot store $precision digits (max $maxPrecision)")
       }
 
@@ -166,14 +166,14 @@ object ParquetSchemaClipShims {
               ParquetTimestampAnnotationShims.timestampTypeForMillisOrMicros(timestamp)
           case timestamp: TimestampLogicalTypeAnnotation if timestamp.getUnit == TimeUnit.NANOS &&
               ParquetLegacyNanoAsLongShims.legacyParquetNanosAsLong =>
-            throw new RapidsAnalysisException(
+            throw RapidsAnalysisException(
               "GPU does not support spark.sql.legacy.parquet.nanosAsLong")
           case _ => illegalType()
         }
 
       case INT96 =>
         if (!SQLConf.get.isParquetINT96AsTimestamp) {
-          throw new RapidsAnalysisException(
+          throw RapidsAnalysisException(
             "INT96 is not supported unless it's interpreted as timestamp. " +
               s"Please try to set ${SQLConf.PARQUET_INT96_AS_TIMESTAMP.key} to true.")
         }
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shuffle/BounceBufferManager.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shuffle/BounceBufferManager.scala
index 0475aa6b6db..98c2f206de1 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shuffle/BounceBufferManager.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shuffle/BounceBufferManager.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2020, NVIDIA CORPORATION.
+ * Copyright (c) 2020-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -20,7 +20,6 @@ import java.util
 
 import ai.rapids.cudf.MemoryBuffer
 
-import org.apache.spark.internal.Logging
 
 /**
  * Class to hold a bounce buffer reference in `buffer`.
@@ -53,9 +52,9 @@ abstract class BounceBuffer(val buffer: MemoryBuffer) extends AutoCloseable {
  * @param deviceBounceBuffer - device buffer to use for sends
  * @param hostBounceBuffer - optional host buffer to use for sends
  */
-case class SendBounceBuffers(
-    deviceBounceBuffer: BounceBuffer,
-    hostBounceBuffer: Option[BounceBuffer]) extends AutoCloseable {
+class SendBounceBuffers(
+    val deviceBounceBuffer: BounceBuffer,
+    val hostBounceBuffer: Option[BounceBuffer]) extends AutoCloseable with Serializable {
 
   def bounceBufferSize: Long = {
     deviceBounceBuffer.buffer.getLength
@@ -82,8 +81,22 @@ class BounceBufferManager[T <: MemoryBuffer](
     val bufferSize: Long,
     val numBuffers: Int,
     allocator: Long => T)
-  extends AutoCloseable
-  with Logging {
+  extends AutoCloseable {
+
+  private val log = org.slf4j.LoggerFactory.getLogger(
+    "com.nvidia.spark.rapids.shuffle.BounceBufferManager")
+
+  private def logDebug(msg: => String): Unit = {
+    if (log.isDebugEnabled) {
+      log.debug(msg)
+    }
+  }
+
+  private def logTrace(msg: => String): Unit = {
+    if (log.isTraceEnabled) {
+      log.trace(msg)
+    }
+  }
 
   class BounceBufferImpl(buff: MemoryBuffer) extends BounceBuffer(buff) {
     override def free(bb: BounceBuffer): Unit = {
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shuffle/BufferReceiveState.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shuffle/BufferReceiveState.scala
index 60d3b13de37..d05da04a589 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shuffle/BufferReceiveState.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shuffle/BufferReceiveState.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2020-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2020-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -26,12 +26,11 @@ import com.nvidia.spark.rapids.NvtxRegistry
 import com.nvidia.spark.rapids.format.TableMeta
 import com.nvidia.spark.rapids.jni.RmmSpark
 
-import org.apache.spark.internal.Logging
 
-case class ConsumedBatchFromBounceBuffer(
-    contigBuffer: DeviceMemoryBuffer,
-    meta: TableMeta,
-    handler: RapidsShuffleFetchHandler)
+class ConsumedBatchFromBounceBuffer(
+    val contigBuffer: DeviceMemoryBuffer,
+    val meta: TableMeta,
+    val handler: RapidsShuffleFetchHandler) extends Serializable
 
 /**
  * A helper case class to maintain the state associated with a transfer request to a peer.
@@ -59,7 +58,21 @@ class BufferReceiveState(
     requests: Seq[PendingTransferRequest],
     transportOnClose: () => Unit,
     stream: Cuda.Stream = Cuda.DEFAULT_STREAM)
-    extends AutoCloseable with Logging {
+    extends AutoCloseable {
+
+  private val log = org.slf4j.LoggerFactory.getLogger(classOf[BufferReceiveState])
+
+  private def logWarning(msg: => String): Unit = {
+    if (log.isWarnEnabled) {
+      log.warn(msg)
+    }
+  }
+
+  private def logDebug(msg: => String): Unit = {
+    if (log.isDebugEnabled) {
+      log.debug(msg)
+    }
+  }
 
   val transportBuffer = new CudfTransportBuffer(bounceBuffer.buffer)
   // we use this to keep a list (should be depth 1) of "requests for receives"
@@ -223,7 +236,7 @@ class BufferReceiveState(
           }
 
           if (contigBuffer != null) {
-            Some(ConsumedBatchFromBounceBuffer(
+            Some(new ConsumedBatchFromBounceBuffer(
               contigBuffer, pendingTransferRequest.tableMeta, pendingTransferRequest.handler))
           } else {
             None
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shuffle/BufferSendState.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shuffle/BufferSendState.scala
index 0a7942bd581..22f5655680e 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shuffle/BufferSendState.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shuffle/BufferSendState.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2020-2024, NVIDIA CORPORATION.
+ * Copyright (c) 2020-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -22,7 +22,6 @@ import com.nvidia.spark.rapids.Arm.withResource
 import com.nvidia.spark.rapids.RapidsPluginImplicits._
 import com.nvidia.spark.rapids.format.{BufferMeta, BufferTransferRequest}
 
-import org.apache.spark.internal.Logging
 import org.apache.spark.shuffle.rapids.RapidsShuffleSendPrepareException
 
 /**
@@ -56,7 +55,21 @@ class BufferSendState(
     sendBounceBuffers: SendBounceBuffers,
     requestHandler: RapidsShuffleRequestHandler,
     serverStream: Cuda.Stream = Cuda.DEFAULT_STREAM)
-    extends AutoCloseable with Logging {
+    extends AutoCloseable {
+
+  private val log = org.slf4j.LoggerFactory.getLogger(classOf[BufferSendState])
+
+  private def logWarning(msg: => String): Unit = {
+    if (log.isWarnEnabled) {
+      log.warn(msg)
+    }
+  }
+
+  private def logDebug(msg: => String): Unit = {
+    if (log.isDebugEnabled) {
+      log.debug(msg)
+    }
+  }
 
   class SendBlock(val bufferHandle: RapidsShuffleHandle) extends BlockWithSize {
     // we assume that the size of the buffer won't change as it goes to host/disk
@@ -148,8 +161,8 @@ class BufferSendState(
     }
   }
 
-  case class RangeBuffer(
-      range: BlockRange[SendBlock], rapidsBuffer: MemoryBuffer)
+  private class RangeBuffer(
+      val range: BlockRange[SendBlock], val rapidsBuffer: MemoryBuffer)
       extends AutoCloseable {
     override def close(): Unit = {
       rapidsBuffer.close()
@@ -189,7 +202,7 @@ class BufferSendState(
               case _ =>
                 hostBuffs += blockRange.rangeSize()
             }
-            RangeBuffer(blockRange, buff)
+            new RangeBuffer(blockRange, buff)
           }
 
           logDebug(s"Occupancy for bounce buffer is " +
@@ -201,7 +214,9 @@ class BufferSendState(
             hostBounceBuffer.buffer
           }
 
-          acquiredBuffs.foreach { case RangeBuffer(blockRange, memoryBuffer) =>
+          acquiredBuffs.foreach { rangeBuffer =>
+            val blockRange = rangeBuffer.range
+            val memoryBuffer = rangeBuffer.rapidsBuffer
             needsCleanup = true
             require(blockRange.rangeSize() <= bounceBuffToUse.getLength - buffOffset)
             bounceBuffToUse.copyFromMemoryBufferAsync(
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shuffle/RapidsShuffleClient.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shuffle/RapidsShuffleClient.scala
index 5498dd890c4..7bc24b6c343 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shuffle/RapidsShuffleClient.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shuffle/RapidsShuffleClient.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2020-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2020-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -25,7 +25,6 @@ import com.nvidia.spark.rapids._
 import com.nvidia.spark.rapids.Arm.withResource
 import com.nvidia.spark.rapids.format.{MetadataResponse, TableMeta, TransferState}
 
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.rapids.GpuShuffleEnv
 import org.apache.spark.storage.ShuffleBlockBatchId
 
@@ -70,9 +69,9 @@ trait RapidsShuffleFetchHandler {
  * @param tableMeta shuffle metadata describing the table
  * @param handler a specific handler that is waiting for this batch
  */
-case class PendingTransferRequest(client: RapidsShuffleClient,
-                                  tableMeta: TableMeta,
-                                  handler: RapidsShuffleFetchHandler) {
+class PendingTransferRequest(val client: RapidsShuffleClient,
+                             val tableMeta: TableMeta,
+                             val handler: RapidsShuffleFetchHandler) extends Serializable {
   val getLength: Long = tableMeta.bufferMeta.size()
 }
 
@@ -98,7 +97,28 @@ class RapidsShuffleClient(
     exec: Executor,
     clientCopyExecutor: Executor,
     catalog: ShuffleReceivedBufferCatalog = GpuShuffleEnv.getReceivedCatalog)
-      extends Logging with AutoCloseable {
+      extends AutoCloseable {
+
+  private val log = org.slf4j.LoggerFactory.getLogger(classOf[RapidsShuffleClient])
+
+  // INFO helper: the by-name `msg` is evaluated only when INFO is enabled.
+  private def logInfo(msg: => String): Unit =
+    if (log.isInfoEnabled) {
+      log.info(msg)
+    }
+
+  // WARN helper: the by-name `msg` is evaluated only when WARN is enabled.
+  private def logWarning(msg: => String): Unit =
+    if (log.isWarnEnabled) {
+      log.warn(msg)
+    }
+
+  // DEBUG helper: the by-name `msg` is evaluated only when DEBUG is enabled.
+  private def logDebug(msg: => String): Unit =
+    if (log.isDebugEnabled) {
+      log.debug(msg)
+    }
+
 
   // these are handlers that are interested (live spark tasks) in peer failure handling
   private val liveHandlers =
@@ -338,7 +358,7 @@ class RapidsShuffleClient(
       // We check the uncompressedSize to make sure we don't request a 0-sized buffer
       // from a peer. We treat such a corner case as a degenerate batch
       if (tableMeta.bufferMeta() != null && tableMeta.bufferMeta().uncompressedSize() > 0) {
-        ptrs += PendingTransferRequest(
+        ptrs += new PendingTransferRequest(
           this,
           tableMeta,
           handler)
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shuffle/RapidsShuffleServer.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shuffle/RapidsShuffleServer.scala
index 8d7817da595..430a59b6888 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shuffle/RapidsShuffleServer.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shuffle/RapidsShuffleServer.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2020-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2020-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -25,7 +25,6 @@ import com.nvidia.spark.rapids.{NvtxRegistry, RapidsConf, RapidsShuffleHandle, S
 import com.nvidia.spark.rapids.Arm.{closeOnExcept, withResource}
 import com.nvidia.spark.rapids.format.TableMeta
 
-import org.apache.spark.internal.Logging
 import org.apache.spark.shuffle.rapids.RapidsShuffleSendPrepareException
 import org.apache.spark.sql.rapids.execution.TrampolineUtil
 import org.apache.spark.storage.{BlockManagerId, ShuffleBlockBatchId}
@@ -74,7 +73,40 @@ class RapidsShuffleServer(transport: RapidsShuffleTransport,
                           requestHandler: RapidsShuffleRequestHandler,
                           exec: Executor,
                           bssExec: Executor,
-                          rapidsConf: RapidsConf) extends AutoCloseable with Logging {
+                          rapidsConf: RapidsConf) extends AutoCloseable {
+
+  private val log = org.slf4j.LoggerFactory.getLogger(classOf[RapidsShuffleServer])
+
+  // WARN helper: the by-name `msg` is evaluated only when WARN is enabled.
+  private def logWarning(msg: => String): Unit =
+    if (log.isWarnEnabled) {
+      log.warn(msg)
+    }
+
+  // DEBUG helper: the by-name `msg` is evaluated only when DEBUG is enabled.
+  private def logDebug(msg: => String): Unit =
+    if (log.isDebugEnabled) {
+      log.debug(msg)
+    }
+
+  // TRACE helper: the by-name `msg` is evaluated only when TRACE is enabled.
+  private def logTrace(msg: => String): Unit =
+    if (log.isTraceEnabled) {
+      log.trace(msg)
+    }
+
+  // ERROR helper: the by-name `msg` is evaluated only when ERROR is enabled.
+  private def logError(msg: => String): Unit =
+    if (log.isErrorEnabled) {
+      log.error(msg)
+    }
+
+  // ERROR helper that also hands `throwable` to the logger.
+  private def logError(msg: => String, throwable: Throwable): Unit =
+    if (log.isErrorEnabled) {
+      log.error(msg, throwable)
+    }
+
 
   def getId: BlockManagerId = {
     // upon seeing this port, the other side will try to connect to the port
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shuffle/RapidsShuffleTransport.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shuffle/RapidsShuffleTransport.scala
index ef45bf5059d..5c468f75d88 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shuffle/RapidsShuffleTransport.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shuffle/RapidsShuffleTransport.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2020-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2020-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -16,14 +16,13 @@
 
 package com.nvidia.spark.rapids.shuffle
 
-import java.nio.{ByteBuffer, ByteOrder}
+import java.nio.{Buffer, ByteBuffer, ByteOrder}
 import java.util.concurrent.ConcurrentLinkedQueue
 import java.util.concurrent.atomic.AtomicInteger
 
 import ai.rapids.cudf.MemoryBuffer
 import com.nvidia.spark.rapids.{NvtxRegistry, RapidsConf, ShimReflectionUtils}
 
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.rapids.storage.RapidsStorageUtils
 import org.apache.spark.storage.BlockManagerId
 
@@ -156,20 +155,6 @@ object TransactionStatus extends Enumeration {
   val NotStarted, InProgress, Complete, Success, Error, Cancelled = Value
 }
 
-/**
- * Case class representing stats for the a transaction
- * @param txTimeMs amount of time this [[Transaction]] took
- * @param sendSize amount of bytes sent
- * @param receiveSize amount of bytes received
- * @param sendThroughput send throughput in GB/sec
- * @param recvThroughput receive throughput in GB/sec
- */
-case class TransactionStats(txTimeMs: Double,
-                            sendSize: Long,
-                            receiveSize: Long,
-                            sendThroughput: Double,
-                            recvThroughput: Double)
-
 /**
  * TransportBuffer represents a buffer with an address and length.
  *
@@ -194,7 +179,7 @@ class MetadataTransportBuffer(val dbb: RefCountedDirectByteBuffer) extends Trans
   def copy(in: ByteBuffer): Unit = {
     val bb = dbb.getBuffer()
     bb.put(in)
-    bb.rewind()
+    bb.asInstanceOf[Buffer].rewind()
   }
 
   override def getAddress(): Long =
@@ -400,7 +385,15 @@ trait RapidsShuffleTransport extends AutoCloseable {
  *
  * @param bufferSize the size of direct `ByteBuffer` to allocate.
  */
-class DirectByteBufferPool(bufferSize: Long) extends Logging {
+class DirectByteBufferPool(bufferSize: Long) {
+  private val log = org.slf4j.LoggerFactory.getLogger(classOf[DirectByteBufferPool])
+
+  // DEBUG helper: the by-name `msg` is evaluated only when DEBUG is enabled.
+  private def logDebug(msg: => String): Unit =
+    if (log.isDebugEnabled) {
+      log.debug(msg)
+    }
+
   val buffers = new ConcurrentLinkedQueue[ByteBuffer]()
   val high = new AtomicInteger(0)
 
@@ -415,7 +408,7 @@ class DirectByteBufferPool(bufferSize: Long) extends Logging {
       logDebug(s"Allocating new direct buffer, high watermark = $high")
       new RefCountedDirectByteBuffer(ByteBuffer.allocateDirect(bufferSize.toInt), Option(this))
     } else {
-      buff.clear()
+      buff.asInstanceOf[Buffer].clear()
       // Reset endianness to BIG_ENDIAN, as it could have changed depending on the consumer
       // (i.e. flat buffers force byte order to be LITTLE_ENDIAN, but pool consumers could be
       //  things like handshake messages that don't use flat buffers).
@@ -430,7 +423,7 @@ class DirectByteBufferPool(bufferSize: Long) extends Logging {
 
   def releaseBuffer(buff: RefCountedDirectByteBuffer): Boolean = {
     logDebug(s"Free direct buffers ${buffers.size()}")
-    buff.getBuffer().clear()
+    buff.getBuffer().asInstanceOf[Buffer].clear()
     buffers.offer(buff.getBuffer())
   }
 }
@@ -531,7 +524,7 @@ object TransportUtils {
     NvtxRegistry.TRANSPORT_COPY_BUFFER.push()
     try {
       val ro = src.asReadOnlyBuffer()
-      ro.limit(ro.position() + size) // make sure we only copy size bytes
+      ro.asInstanceOf[Buffer].limit(ro.position() + size) // make sure we only copy size bytes
       // copy from position to remaining = (limit - position)
       dst.put(ro) // bulk put
     } finally {
@@ -550,7 +543,16 @@ object TransportUtils {
   }
 }
 
-object RapidsShuffleTransport extends Logging {
+object RapidsShuffleTransport {
+  private val log = org.slf4j.LoggerFactory.getLogger(
+    "com.nvidia.spark.rapids.shuffle.RapidsShuffleTransport")
+
+  // ERROR helper: logs `msg` with `throwable`; `msg` is only built when ERROR is enabled.
+  private def logError(msg: => String, throwable: Throwable): Unit =
+    if (log.isErrorEnabled) {
+      log.error(msg, throwable)
+    }
+
   /**
    * Used in `BlockManagerId`s when returning a map status after a shuffle write to
    * let the readers know what TCP port to use to establish a transport connection.
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shuffle/WindowedBlockIterator.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shuffle/WindowedBlockIterator.scala
index 2fdce9862ad..9ba96c2bf5c 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shuffle/WindowedBlockIterator.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/shuffle/WindowedBlockIterator.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2020-2023, NVIDIA CORPORATION.
+ * Copyright (c) 2020-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -18,37 +18,6 @@ package com.nvidia.spark.rapids.shuffle
 
 import scala.collection.mutable.ArrayBuffer
 
-// Helper trait that callers can use to add blocks to the iterator
-// as long as they can provide a size
-trait BlockWithSize {
-  /**
-   * Abstract method to return the size in bytes of this block
-   * @return Long - size in bytes
-   */
-  def size: Long
-}
-
-/**
- * Specifies a start and end range of bytes for a block.
- * @param block - a BlockWithSize instance
- * @param rangeStart - byte offset for the start of the range (inclusive)
- * @param rangeEnd - byte offset for the end of the range (exclusive)
- * @tparam T - the specific type of `BlockWithSize`
- */
-case class BlockRange[T <: BlockWithSize](
-    block: T, rangeStart: Long, rangeEnd: Long) {
-  require(rangeStart < rangeEnd,
-    s"Instantiated a BlockRange with invalid boundaries: $rangeStart to $rangeEnd")
-
-  /**
-   * Returns the size of this range in bytes
-   * @return - Long - size in bytes
-   */
-  def rangeSize(): Long = rangeEnd - rangeStart
-
-  def isComplete(): Boolean = rangeEnd == block.size
-}
-
 /**
  * Given a set of blocks, this iterator returns BlockRanges
  * of such blocks that fit `windowSize`. The ranges are just logical
@@ -90,21 +59,21 @@ class WindowedBlockIterator[T <: BlockWithSize](blocks: Seq[T], windowSize: Long
 
   require(windowSize > 0, s"Invalid window size specified $windowSize")
 
-  private case class BlockWindow(start: Long, size: Long) {
-    val end = start + size // exclusive end offset
+  private class BlockWindow(val start: Long, val size: Long) {
+    val end: Long = start + size // exclusive end offset
     def move(): BlockWindow = {
-      BlockWindow(start + size, size)
+      new BlockWindow(start + size, size)
     }
   }
 
   // start the window at byte 0
-  private[this] var window = BlockWindow(0, windowSize)
+  private[this] var window = new BlockWindow(0, windowSize)
   private[this] var done = false
 
   // helper class that captures the start/end byte offset
   // for `block` on creation
-  private case class BlockWithOffset[T <: BlockWithSize](
-      block: T, startOffset: Long, endOffset: Long)
+  private class BlockWithOffset[T <: BlockWithSize](
+      val block: T, val startOffset: Long, val endOffset: Long)
 
   private[this] val blocksWithOffsets = {
     var lastOffset = 0L
@@ -113,7 +82,7 @@ class WindowedBlockIterator[T <: BlockWithSize](blocks: Seq[T], windowSize: Long
       val startOffset = lastOffset
       val endOffset = startOffset + block.size
       lastOffset = endOffset // for next block
-      BlockWithOffset(block, startOffset, endOffset)
+      new BlockWithOffset(block, startOffset, endOffset)
     }
   }
 
@@ -121,9 +90,10 @@ class WindowedBlockIterator[T <: BlockWithSize](blocks: Seq[T], windowSize: Long
   // is an index into the `blocksWithOffsets` sequence
   private[this] var lastSeenBlock = 0
 
-  case class BlocksForWindow(lastBlockIndex: Option[Int],
-      blockRanges: Seq[BlockRange[T]],
-      hasMoreBlocks: Boolean)
+  private class BlocksForWindow(
+      val lastBlockIndex: Option[Int],
+      val blockRanges: Seq[BlockRange[T]],
+      val hasMoreBlocks: Boolean)
 
   private def getBlocksForWindow(
       window: BlockWindow,
@@ -144,7 +114,7 @@ class WindowedBlockIterator[T <: BlockWithSize](blocks: Seq[T], windowSize: Long
         if (window.end >= b.endOffset) {
           rangeEnd = b.endOffset - b.startOffset
         }
-        blockRangesInWindow.append(BlockRange[T](b.block, rangeStart, rangeEnd))
+        blockRangesInWindow.append(new BlockRange[T](b.block, rangeStart, rangeEnd))
         lastBlockIndex = Some(thisBlock)
       } else {
         // skip this block, unless it's before our window starts
@@ -153,7 +123,7 @@ class WindowedBlockIterator[T <: BlockWithSize](blocks: Seq[T], windowSize: Long
       thisBlock = thisBlock + 1
     }
     val lastBlock = blockRangesInWindow.last
-    BlocksForWindow(lastBlockIndex,
+    new BlocksForWindow(lastBlockIndex,
       blockRangesInWindow.toSeq,
       !continue || !lastBlock.isComplete())
   }
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/sparkRapidsListeners.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/sparkRapidsListeners.scala
index cc95afa51fa..3742e9528ae 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/sparkRapidsListeners.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/sparkRapidsListeners.scala
@@ -18,12 +18,12 @@ package com.nvidia.spark.rapids
 
 import org.apache.spark.scheduler.SparkListenerEvent
 
-case class SparkRapidsBuildInfoEvent(
-  sparkRapidsBuildInfo: Map[String, String],
-  sparkRapidsJniBuildInfo: Map[String, String],
-  cudfBuildInfo: Map[String, String],
-  sparkRapidsPrivateBuildInfo: Map[String, String]
-) extends SparkListenerEvent
+class SparkRapidsBuildInfoEvent(
+  val sparkRapidsBuildInfo: Map[String, String],
+  val sparkRapidsJniBuildInfo: Map[String, String],
+  val cudfBuildInfo: Map[String, String],
+  val sparkRapidsPrivateBuildInfo: Map[String, String]
+) extends SparkListenerEvent with Serializable
 
 /**
  * Event posted when a shuffle is unregistered, containing disk I/O savings statistics.
@@ -37,11 +37,11 @@ case class SparkRapidsBuildInfoEvent(
  * @param numSpills Number of buffers that were spilled to disk
  * @param numForcedFileOnly Number of buffers that used forced file-only mode
  */
-case class SparkRapidsShuffleDiskSavingsEvent(
-  shuffleId: Int,
-  bytesFromMemory: Long,
-  bytesFromDisk: Long,
-  numExpansions: Int = 0,
-  numSpills: Int = 0,
-  numForcedFileOnly: Int = 0
-) extends SparkListenerEvent
+class SparkRapidsShuffleDiskSavingsEvent(
+  val shuffleId: Int,
+  val bytesFromMemory: Long,
+  val bytesFromDisk: Long,
+  val numExpansions: Int, // NOTE(review): last 3 params lost `= 0` defaults; check callers
+  val numSpills: Int,
+  val numForcedFileOnly: Int
+) extends SparkListenerEvent with Serializable
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/spill/SpillFramework.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/spill/SpillFramework.scala
index 2a05e486e9a..dbafe1c4f65 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/spill/SpillFramework.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/spill/SpillFramework.scala
@@ -17,7 +17,7 @@
 package com.nvidia.spark.rapids.spill
 
 import java.io._
-import java.nio.ByteBuffer
+import java.nio.{Buffer, ByteBuffer}
 import java.nio.channels.{Channels, FileChannel, WritableByteChannel}
 import java.nio.file.StandardOpenOption
 import java.util
@@ -27,16 +27,14 @@ import java.util.concurrent.ArrayBlockingQueue
 import scala.collection.mutable
 
 import ai.rapids.cudf._
-import com.nvidia.spark.rapids.{GpuColumnVector, GpuColumnVectorFromBuffer, GpuCompressedColumnVector, GpuDeviceManager, HashedPriorityQueue, HostAlloc, HostMemoryOutputStream, MemoryBufferToHostByteBufferIterator, NvtxId, NvtxRegistry, RapidsConf, RapidsHostColumnVector}
+import com.nvidia.spark.rapids.{GpuColumnVector, GpuColumnVectorFromBuffer, GpuCompressedColumnVector, GpuDeviceManager, HashedPriorityQueue, HostAlloc, HostByteBufferIterator, HostMemoryOutputStream, MemoryBufferToHostByteBufferIterator, NvtxId, NvtxRegistry, RapidsConf, RapidsHostColumnVector}
 import com.nvidia.spark.rapids.Arm.{closeOnExcept, withResource}
 import com.nvidia.spark.rapids.RapidsPluginImplicits.AutoCloseableSeq
 import com.nvidia.spark.rapids.format.TableMeta
-import com.nvidia.spark.rapids.internal.HostByteBufferIterator
 import com.nvidia.spark.rapids.jni.TaskPriority
 import org.apache.commons.io.IOUtils
 
 import org.apache.spark.{SparkConf, SparkEnv, TaskContext}
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.rapids.{GpuTaskMetrics, RapidsDiskBlockManager}
 import org.apache.spark.sql.rapids.execution.{SerializedHostTableUtils, TrampolineUtil}
 import org.apache.spark.sql.rapids.storage.RapidsStorageUtils
@@ -172,7 +170,13 @@ trait StoreHandle extends AutoCloseable {
   var taskPriority: Long = taskId.map(TaskPriority.getTaskPriority).getOrElse(Long.MaxValue)
 }
 
-trait SpillableHandle extends StoreHandle with Logging {
+trait SpillableHandle extends StoreHandle {
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+
+  // Guarded so the by-name `msg` is only evaluated when WARN logging is enabled.
+  private def logWarning(msg: => String, throwable: Throwable): Unit =
+    if (log.isWarnEnabled) log.warn(msg, throwable)
+
   /**
    * used to gate when a spill is actively being done so that a second thread won't
    * also begin spilling, and a handle won't release the underlying buffer if it's
@@ -349,7 +353,7 @@ trait HostSpillableHandle[T <: AutoCloseable] extends SpillableHandle {
   }
 }
 
-object SpillableHostBufferHandle extends Logging {
+object SpillableHostBufferHandle {
   def apply(hmb: HostMemoryBuffer): SpillableHostBufferHandle = {
     val handle = new SpillableHostBufferHandle(hmb.getLength, host = Some(hmb))
     SpillFramework.stores.hostStore.trackNoSpill(handle)
@@ -675,7 +679,7 @@ class SpillableColumnarBatchHandle private (
     override val approxSizeInBytes: Long,
     private[spill] override var dev: Option[ColumnarBatch],
     private[spill] var host: Option[SpillableHostBufferHandle] = None)
-  extends DeviceSpillableHandle[ColumnarBatch] with Logging {
+  extends DeviceSpillableHandle[ColumnarBatch] {
 
   override def spillable: Boolean = synchronized {
     if (super.spillable) {
@@ -1305,7 +1309,7 @@ object HandleComparator extends util.Comparator[StoreHandle] {
   }
 }
 
-trait HandleStore[T <: StoreHandle] extends AutoCloseable with Logging {
+trait HandleStore[T <: StoreHandle] extends AutoCloseable {
   protected lazy val handles = new HashedPriorityQueue[T](HandleComparator)
 
   def numHandles: Int = synchronized {
@@ -1358,7 +1362,7 @@ trait HandleStore[T <: StoreHandle] extends AutoCloseable with Logging {
 }
 
 trait SpillableStore[T <: SpillableHandle]
-    extends HandleStore[T] with Logging {
+    extends HandleStore[T] {
   protected def spillNvtxRange: NvtxId
 
   /**
@@ -1480,8 +1484,16 @@ trait SpillableStore[T <: SpillableHandle]
 }
 
 class SpillableHostStore(val maxSize: Option[Long] = None)
-  extends SpillableStore[HostSpillableHandle[_]]
-    with Logging {
+  extends SpillableStore[HostSpillableHandle[_]] {
+
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+
+  // INFO helper: the by-name `msg` is evaluated only when INFO is enabled.
+  private def logInfo(msg: => String): Unit =
+    if (log.isInfoEnabled) {
+      log.info(msg)
+    }
+
 
   private[spill] var totalSize: Long = 0L
 
@@ -1648,7 +1660,7 @@ class SpillableHostStore(val maxSize: Option[Long] = None)
   private class SpillableHostBufferHandleBuilderForHost(
     var handle: SpillableHostBufferHandle,
     var singleShotBuffer: HostMemoryBuffer)
-      extends SpillableHostBufferHandleBuilder with Logging {
+      extends SpillableHostBufferHandleBuilder {
     private var copied = 0L
 
     override def copyNext(mb: DeviceMemoryBuffer, len: Long, stream: Cuda.Stream): Unit = {
@@ -1752,7 +1764,13 @@ class SpillableDeviceStore extends SpillableStore[DeviceSpillableHandle[_]] {
 }
 
 class DiskHandleStore(conf: SparkConf)
-    extends HandleStore[DiskHandle] with Logging {
+    extends HandleStore[DiskHandle] {
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+
+  // Guarded so the by-name `msg` is only evaluated when WARN logging is enabled.
+  private def logWarning(msg: => String): Unit =
+    if (log.isWarnEnabled) log.warn(msg)
+
   val diskBlockManager: RapidsDiskBlockManager = new RapidsDiskBlockManager(conf)
 
   def getFile(blockId: BlockId): File = {
@@ -1915,7 +1933,7 @@ class SpillableTableHandle private (
     override val approxSizeInBytes: Long,
     private[spill] override var dev: Option[Table],
     private[spill] var host: Option[SpillableHostBufferHandle] = None)
-  extends DeviceSpillableHandle[Table] with Logging {
+  extends DeviceSpillableHandle[Table] {
 
   override def spillable: Boolean = synchronized {
     if (super.spillable) {
@@ -2047,7 +2065,19 @@ object SpillableTableHandle {
   }
 }
 
-object SpillFramework extends Logging {
+object SpillFramework {
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+
+  // INFO helper: the by-name `msg` is evaluated only when INFO is enabled.
+  private def logInfo(msg: => String): Unit = {
+    if (log.isInfoEnabled) log.info(msg)
+  }
+
+  // WARN helper: guarded the same way as logInfo so a disabled level never builds `msg`.
+  private def logWarning(msg: => String): Unit = {
+    if (log.isWarnEnabled) log.warn(msg)
+  }
+
   // public for tests. Some tests not in the `spill` package require setting this
   // because they need fine control over allocations.
   var storesInternal: SpillableStores = _
@@ -2211,7 +2241,13 @@ private[spill] class BounceBuffer[T <: AutoCloseable](
 class BounceBufferPool[T <: AutoCloseable](private val bufSize: Long,
                                            private val bbCount: Int,
                                            private val allocator: Long => T)
-  extends AutoCloseable with Logging {
+  extends AutoCloseable {
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+
+  // Guarded so the by-name `msg` is only evaluated when ERROR logging is enabled.
+  private def logError(msg: => String): Unit =
+    if (log.isErrorEnabled) log.error(msg)
+
 
   private val pool = new ArrayBlockingQueue[BounceBuffer[T]](bbCount)
   for (_ <- 1 to bbCount) {
@@ -2277,7 +2313,13 @@ class BounceBufferPool[T <: AutoCloseable](private val bufSize: Long,
  */
 class ChunkedPacker(table: Table,
                     bounceBufferPool: BounceBufferPool[DeviceMemoryBuffer])
-  extends Iterator[(BounceBuffer[DeviceMemoryBuffer], Long)] with Logging with AutoCloseable {
+  extends Iterator[(BounceBuffer[DeviceMemoryBuffer], Long)] with AutoCloseable {
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+
+  // Guarded so the by-name `msg` is only evaluated when WARN logging is enabled.
+  private def logWarning(msg: => String): Unit =
+    if (log.isWarnEnabled) log.warn(msg)
+
 
   private var closed: Boolean = false
 
@@ -2310,7 +2352,7 @@ class ChunkedPacker(table: Table,
     val tmpBB = packedMeta.getMetadataDirectBuffer
     val metaCopy = ByteBuffer.allocateDirect(tmpBB.capacity())
     metaCopy.put(tmpBB)
-    metaCopy.flip()
+    metaCopy.asInstanceOf[Buffer].flip()
     metaCopy
   }
 
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/spill/SpillablePartialFileHandle.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/spill/SpillablePartialFileHandle.scala
index 52dfd286773..9f47cd41f0f 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/spill/SpillablePartialFileHandle.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/spill/SpillablePartialFileHandle.scala
@@ -17,14 +17,13 @@
 package com.nvidia.spark.rapids.spill
 
 import java.io.{BufferedInputStream, BufferedOutputStream, File, FileInputStream, FileOutputStream, IOException, RandomAccessFile}
-import java.nio.ByteBuffer
+import java.nio.{Buffer, ByteBuffer}
 import java.nio.channels.FileChannel
 
 import ai.rapids.cudf.HostMemoryBuffer
 import com.nvidia.spark.rapids.Arm.{closeOnExcept, withResource}
 import com.nvidia.spark.rapids.HostAlloc
 
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.rapids.GpuTaskMetrics
 import org.apache.spark.sql.rapids.execution.TrampolineUtil
 
@@ -74,7 +73,25 @@ class SpillablePartialFileHandle private (
     priority: Long,
     syncWrites: Boolean,
     capacityHintProvider: Option[(Long, Long) => Long])
-  extends HostSpillableHandle[ai.rapids.cudf.HostMemoryBuffer] with Logging {
+  extends HostSpillableHandle[ai.rapids.cudf.HostMemoryBuffer] {
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+
+  // DEBUG helper: the by-name `msg` is evaluated only when DEBUG is enabled.
+  private def logDebug(msg: => String): Unit =
+    if (log.isDebugEnabled) {
+      log.debug(msg)
+    }
+
+  // DEBUG helper that also hands `throwable` to the logger.
+  private def logDebug(msg: => String, throwable: Throwable): Unit =
+    if (log.isDebugEnabled) {
+      log.debug(msg, throwable)
+    }
+
+  // Guarded so the by-name `msg` is only evaluated when WARN logging is enabled.
+  private def logWarning(msg: => String, throwable: Throwable): Unit =
+    if (log.isWarnEnabled) log.warn(msg, throwable)
+
 
   // State management
   @volatile private var spilledToDisk: Boolean = false
@@ -257,7 +274,7 @@ class SpillablePartialFileHandle private (
     withResource(new FileOutputStream(file)) { fos =>
       val channel = fos.getChannel
       val bb = buffer.asByteBuffer()
-      bb.limit(writePosition.toInt)
+      bb.asInstanceOf[Buffer].limit(writePosition.toInt)
       while (bb.hasRemaining) {
         channel.write(bb)
       }
@@ -669,7 +686,7 @@ class SpillablePartialFileHandle private (
       try {
         val channel = fos.getChannel
         val bb = bufferToSpill.asByteBuffer()
-        bb.limit(totalBytesWritten.toInt)
+        bb.asInstanceOf[Buffer].limit(totalBytesWritten.toInt)
         while (bb.hasRemaining) {
           channel.write(bb)
         }
@@ -798,7 +815,7 @@ class SpillablePartialFileHandle private (
   }
 }
 
-object SpillablePartialFileHandle extends Logging {
+object SpillablePartialFileHandle {
 
   /**
    * Create a file-only handle.
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/window/BasicWindowCalc.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/window/BasicWindowCalc.scala
index 7ece2df3ef6..8ce4eaa37da 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/window/BasicWindowCalc.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/window/BasicWindowCalc.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2024, NVIDIA CORPORATION.
+ * Copyright (c) 2024-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -39,15 +39,27 @@ import org.apache.spark.unsafe.types.CalendarInterval
  * groups those two together so we can have a complete picture of how to perform these types of
  * aggregations.
  */
-case class AggAndReplace[T](agg: T, nullReplacePolicy: Option[ReplacePolicy])
+class AggAndReplace[T](val agg: T, val nullReplacePolicy: Option[ReplacePolicy])
 
 /**
  * The class represents a window function and the locations of its deduped inputs after an initial
  * projection.
  */
-case class BoundGpuWindowFunction(
-    windowFunc: GpuWindowFunction,
-    boundInputLocations: Array[Int]) {
+class BoundGpuWindowFunction(
+    val windowFunc: GpuWindowFunction,
+    val boundInputLocations: Array[Int]) {
+
+  override def equals(other: Any): Boolean = other match {
+    case that: BoundGpuWindowFunction => // array is compared by reference, not by content
+      windowFunc == that.windowFunc && boundInputLocations.eq(that.boundInputLocations)
+    case _ => false
+  }
+
+  override def hashCode(): Int = {
+    var result = windowFunc.##
+    result = 31 * result + System.identityHashCode(boundInputLocations) // identity, as in equals
+    result
+  }
 
   /**
    * Get the operations to perform a scan aggregation.
@@ -141,7 +153,7 @@ object RangeBoundaryValue {
   def double(value: Double): DoubleRangeBoundaryValue = DoubleRangeBoundaryValue(value)
 }
 
-case class ParsedBoundary(isUnbounded: Boolean, value: RangeBoundaryValue)
+class ParsedBoundary(val isUnbounded: Boolean, val value: RangeBoundaryValue) extends Serializable
 
 object GroupedAggregations {
   /**
@@ -295,7 +307,7 @@ object GroupedAggregations {
   private def getRangeBoundaryValue(boundary: Expression, orderByType: DType): ParsedBoundary =
     boundary match {
       case special: GpuSpecialFrameBoundary =>
-        ParsedBoundary(
+        new ParsedBoundary(
           isUnbounded = special.isUnbounded,
           value = orderByType.getTypeId match {
             case DType.DTypeEnum.DECIMAL128 => RangeBoundaryValue.bigInt(special.value)
@@ -308,38 +320,38 @@ object GroupedAggregations {
         // Get the total microseconds for TIMESTAMP_MICROSECONDS
         var x = TimeUnit.DAYS.toMicros(ci.days) + ci.microseconds
         if (x == Long.MinValue) x = Long.MaxValue
-        ParsedBoundary(isUnbounded = false, RangeBoundaryValue.long(Math.abs(x)))
+        new ParsedBoundary(isUnbounded = false, RangeBoundaryValue.long(Math.abs(x)))
       case GpuLiteral(value, ByteType) =>
         var x = value.asInstanceOf[Byte]
         if (x == Byte.MinValue) x = Byte.MaxValue
-        ParsedBoundary(isUnbounded = false, RangeBoundaryValue.long(Math.abs(x)))
+        new ParsedBoundary(isUnbounded = false, RangeBoundaryValue.long(Math.abs(x)))
       case GpuLiteral(value, ShortType) =>
         var x = value.asInstanceOf[Short]
         if (x == Short.MinValue) x = Short.MaxValue
-        ParsedBoundary(isUnbounded = false, RangeBoundaryValue.long(Math.abs(x)))
+        new ParsedBoundary(isUnbounded = false, RangeBoundaryValue.long(Math.abs(x)))
       case GpuLiteral(value, IntegerType) =>
         var x = value.asInstanceOf[Int]
         if (x == Int.MinValue) x = Int.MaxValue
-        ParsedBoundary(isUnbounded = false, RangeBoundaryValue.long(Math.abs(x)))
+        new ParsedBoundary(isUnbounded = false, RangeBoundaryValue.long(Math.abs(x)))
       case GpuLiteral(value, LongType) =>
         var x = value.asInstanceOf[Long]
         if (x == Long.MinValue) x = Long.MaxValue
-        ParsedBoundary(isUnbounded = false, RangeBoundaryValue.long(Math.abs(x)))
+        new ParsedBoundary(isUnbounded = false, RangeBoundaryValue.long(Math.abs(x)))
       case GpuLiteral(value, FloatType) =>
         var x = value.asInstanceOf[Float]
         if (x == Float.MinValue) x = Float.MaxValue
-        ParsedBoundary(isUnbounded = false, RangeBoundaryValue.double(Math.abs(x)))
+        new ParsedBoundary(isUnbounded = false, RangeBoundaryValue.double(Math.abs(x)))
       case GpuLiteral(value, DoubleType) =>
         var x = value.asInstanceOf[Double]
         if (x == Double.MinValue) x = Double.MaxValue
-        ParsedBoundary(isUnbounded = false, RangeBoundaryValue.double(Math.abs(x)))
+        new ParsedBoundary(isUnbounded = false, RangeBoundaryValue.double(Math.abs(x)))
       case GpuLiteral(value: Decimal, DecimalType()) =>
         orderByType.getTypeId match {
           case DType.DTypeEnum.DECIMAL32 | DType.DTypeEnum.DECIMAL64 =>
-            ParsedBoundary(isUnbounded = false,
+            new ParsedBoundary(isUnbounded = false,
               RangeBoundaryValue.long(Math.abs(value.toUnscaledLong)))
           case DType.DTypeEnum.DECIMAL128 =>
-            ParsedBoundary(isUnbounded = false,
+            new ParsedBoundary(isUnbounded = false,
               RangeBoundaryValue.bigInt(value.toJavaBigDecimal.unscaledValue().abs))
           case anythingElse =>
             throw new UnsupportedOperationException(s"Unexpected Decimal type: $anythingElse")
@@ -378,7 +390,7 @@ class GroupedAggregations {
       data.getOrElseUpdate(win.normalizedFrameSpec, mutable.HashMap.empty)
     }
 
-    forSpec.getOrElseUpdate(BoundGpuWindowFunction(win.wrappedWindowFunc, inputLocs),
+    forSpec.getOrElseUpdate(new BoundGpuWindowFunction(win.wrappedWindowFunc, inputLocs),
       ArrayBuffer.empty) += outputIndex
   }
 
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/window/GpuBatchedBoundedWindowExec.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/window/GpuBatchedBoundedWindowExec.scala
index 49e6d5b23be..dbc2d99c054 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/window/GpuBatchedBoundedWindowExec.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/window/GpuBatchedBoundedWindowExec.scala
@@ -24,7 +24,6 @@ import com.nvidia.spark.rapids.RmmRapidsRetryIterator.withRetryNoSplit
 import com.nvidia.spark.rapids.ScalableTaskCompletion.onTaskCompletion
 
 import org.apache.spark.TaskContext
-import org.apache.spark.internal.Logging
 import org.apache.spark.rdd.RDD
 import org.apache.spark.sql.catalyst.expressions.{Expression, NamedExpression, SortOrder}
 import org.apache.spark.sql.execution.SparkPlan
@@ -41,7 +40,7 @@ class GpuBatchedBoundedWindowIterator(
   maxFollowing: Int,
   numOutputBatches: GpuMetric,
   numOutputRows: GpuMetric,
-  opTime: GpuMetric) extends Iterator[ColumnarBatch] with BasicWindowCalc with Logging {
+  opTime: GpuMetric) extends Iterator[ColumnarBatch] with BasicWindowCalc with RapidsLocalLog {
 
   override def isRunningBatched: Boolean = false  // Not "Running Window" optimized.
                                                   // This is strictly for batching.
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/window/GpuRunningWindowExec.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/window/GpuRunningWindowExec.scala
index a87aea8b954..a1e7271e6b1 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/window/GpuRunningWindowExec.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/window/GpuRunningWindowExec.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2024-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2024-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -242,10 +242,10 @@ case class GpuRunningWindowExec(
     }
     if (gpuPartitionSpec.isEmpty) {
       // If unpartitioned, batch on the order-by column.
-      BatchedByKey(gpuOrderSpec)(cpuOrderSpec)
+      new BatchedByKey(gpuOrderSpec)(cpuOrderSpec)
     } else {
       // If partitioned, batch on partition-columns + order-by columns.
-      BatchedByKey(gpuPartitionOrdering ++ gpuOrderSpec)(cpuPartitionOrdering ++ cpuOrderSpec)
+      new BatchedByKey(gpuPartitionOrdering ++ gpuOrderSpec)(cpuPartitionOrdering ++ cpuOrderSpec)
     }
   }
 
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/window/GpuUnboundedToUnboundedAggWindowExec.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/window/GpuUnboundedToUnboundedAggWindowExec.scala
index d244550b878..30ffc771d70 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/window/GpuUnboundedToUnboundedAggWindowExec.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/window/GpuUnboundedToUnboundedAggWindowExec.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2024-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2024-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -125,8 +125,8 @@ object TableAndBatchUtils {
 // the ride-along columns and the aggregation result should both be sorted by the partition by
 // columns.  Also the aggregation result must have a count column so it can be expanded using
 // repeat to get back to the size of the ride-along columns.
-case class FirstPassAggResult(rideAlongColumns: SpillableColumnarBatch,
-    aggResult: SpillableColumnarBatch) extends AutoCloseable {
+class FirstPassAggResult(val rideAlongColumns: SpillableColumnarBatch,
+    val aggResult: SpillableColumnarBatch) extends AutoCloseable {
   override def close(): Unit = {
     rideAlongColumns.close()
     aggResult.close()
@@ -219,7 +219,7 @@ class GpuUnboundedToUnboundedAggWindowFirstPassIterator(
               val rideAlongColumns = GpuProjectExec.project(preProcessedInput,
                 boundStages.boundRideAlong)
 
-              FirstPassAggResult(
+              new FirstPassAggResult(
                 adoptAndMakeSpillable(rideAlongColumns),
                 toSpillableBatch(aggResultTable,
                   boundStages.groupingColumnTypes ++ boundStages.aggResultTypes))
@@ -333,8 +333,8 @@ class PartitionedFirstPassAggResult(firstPassAggResult: FirstPassAggResult,
 // an iterator of ride-along columns, and the full agg results for those columns. It is not
 // the responsibility of the second stage to try and combine small batches or split up large
 // ones, beyond what the retry framework might do.
-case class SecondPassAggResult(rideAlongColumns: util.LinkedList[SpillableColumnarBatch],
-                               aggResult: SpillableColumnarBatch) extends AutoCloseable {
+class SecondPassAggResult(val rideAlongColumns: util.LinkedList[SpillableColumnarBatch],
+                               val aggResult: SpillableColumnarBatch) extends AutoCloseable {
   override def close(): Unit = {
     rideAlongColumns.forEach(_.close())
     rideAlongColumns.clear()
@@ -467,7 +467,7 @@ class GpuUnboundedToUnboundedAggWindowSecondPassIterator(
                   .asInstanceOf[util.LinkedList[SpillableColumnarBatch]]
               completedRideAlongBatches.add(partitioned.otherGroupRideAlong.get)
               val groupsRemoved = removeGroupColumns(mergedAggResults)
-              SecondPassAggResult(completedRideAlongBatches,
+              new SecondPassAggResult(completedRideAlongBatches,
                                   groupsRemoved)
             }
           }
@@ -503,7 +503,7 @@ class GpuUnboundedToUnboundedAggWindowSecondPassIterator(
                                 boundStages.groupingColumnTypes ++
                                   boundStages.aggResultTypes)) { concatAggResults =>
               withResource(groupByMerge(concatAggResults)) { mergedAggResults =>
-                Some(SecondPassAggResult(rideAlongColumnsPendingCompletion,
+                Some(new SecondPassAggResult(rideAlongColumnsPendingCompletion,
                      removeGroupColumns(mergedAggResults)))
               }
             }
@@ -521,8 +521,8 @@ class GpuUnboundedToUnboundedAggWindowSecondPassIterator(
 // The next to final step is to take the original input data along with the agg data, estimate how
 // to split/combine the input batches to output batches that are close to the target batch size.
 
-case class SlicedBySize(rideAlongColumns: SpillableColumnarBatch,
-    aggResults: SpillableColumnarBatch) extends AutoCloseable {
+class SlicedBySize(val rideAlongColumns: SpillableColumnarBatch,
+    val aggResults: SpillableColumnarBatch) extends AutoCloseable {
   override def close(): Unit = {
     rideAlongColumns.close()
     aggResults.close()
@@ -827,9 +827,9 @@ class PendingSecondAggResults private(
       if (rideAlongColumns.isEmpty) {
         // This is the last batch so we don't need to even figure out where to slice
         // the AggResult
-        SlicedBySize(rideAlongScb, aggResult.incRefCount())
+        new SlicedBySize(rideAlongScb, aggResult.incRefCount())
       } else {
-        SlicedBySize(rideAlongScb, getSlicedAggResultByRepeatedRows(rideAlongScb.numRows()))
+        new SlicedBySize(rideAlongScb, getSlicedAggResultByRepeatedRows(rideAlongScb.numRows()))
       }
     }
   }
@@ -943,12 +943,12 @@ class GpuUnboundedToUnboundedAggFinalIterator(
  * @param boundAggregations aggregations to be done. NOTE THIS IS WIP
  * @param boundFinalProject the final project to get the output in the right order
  */
-case class GpuUnboundedToUnboundedAggStages(
-    inputTypes: Seq[DataType],
-    boundPartitionSpec: Seq[GpuExpression],
-    boundRideAlong: Seq[GpuExpression],
-    boundAggregations: Seq[GpuExpression],
-    boundFinalProject: Seq[GpuExpression]) extends Serializable {
+class GpuUnboundedToUnboundedAggStages(
+    val inputTypes: Seq[DataType],
+    val boundPartitionSpec: Seq[GpuExpression],
+    val boundRideAlong: Seq[GpuExpression],
+    val boundAggregations: Seq[GpuExpression],
+    val boundFinalProject: Seq[GpuExpression]) extends Serializable {
 
   val groupingColumnTypes: Seq[DataType] = boundPartitionSpec.map{_.dataType}
   val groupColumnOrdinals: Seq[Int] = boundPartitionSpec.map {
@@ -1108,7 +1108,7 @@ object GpuUnboundedToUnboundedAggWindowIterator {
     val finalProject = computeFinalProject(rideAlongOutput, aggsToRepeatOutput, windowOps,
       metrics)
 
-    GpuUnboundedToUnboundedAggStages(childTypes, boundPartitionSpec, boundRideAlong,
+    new GpuUnboundedToUnboundedAggStages(childTypes, boundPartitionSpec, boundRideAlong,
                                      boundAggregations, finalProject)
   }
 
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/window/GpuWindowExec.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/window/GpuWindowExec.scala
index 8bf8a0e9dd3..7617a807260 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/window/GpuWindowExec.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/window/GpuWindowExec.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2020-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2020-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -157,7 +157,7 @@ case class GpuWindowExec(
   override def outputBatching: CoalesceGoal = if (gpuPartitionSpec.isEmpty) {
     RequireSingleBatch
   } else {
-    BatchedByKey(gpuPartitionOrdering)(cpuPartitionOrdering)
+    new BatchedByKey(gpuPartitionOrdering)(cpuPartitionOrdering)
   }
 
   override protected def internalDoExecuteColumnar(): RDD[ColumnarBatch] = {
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/window/GpuWindowExecMeta.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/window/GpuWindowExecMeta.scala
index fdb786d98f9..792ca5bff94 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/window/GpuWindowExecMeta.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/window/GpuWindowExecMeta.scala
@@ -221,11 +221,12 @@ class GpuWindowExecMeta(windowExec: WindowExec,
   override def getResultColumnsOnly: Boolean = resultColumnsOnly
 }
 
-case class BatchedOps(running: Seq[NamedExpression],
-    unboundedAgg: Seq[NamedExpression],
-    unboundedDoublePass: Seq[NamedExpression],
-    bounded: Seq[NamedExpression],
-    passThrough: Seq[NamedExpression]) {
+class BatchedOps(
+    val running: Seq[NamedExpression],
+    val unboundedAgg: Seq[NamedExpression],
+    val unboundedDoublePass: Seq[NamedExpression],
+    val bounded: Seq[NamedExpression],
+    val passThrough: Seq[NamedExpression]) {
 
   private def dedupeByExprId[T <: NamedExpression](exprs: Seq[T]): Seq[T] = {
     val seen = mutable.HashSet.empty[ExprId]
@@ -614,7 +615,7 @@ object GpuWindowExecMeta {
         throw new IllegalArgumentException(
           s"Found unexpected expression $other in window exec ${other.getClass}")
     }
-    BatchedOps(running.toSeq,
+    new BatchedOps(running.toSeq,
                unboundedToUnboundedAgg.toSeq,
                doublePass.toSeq,
                batchedBounded.toSeq,
diff --git a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/window/GpuWindowExpression.scala b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/window/GpuWindowExpression.scala
index 2ea997a222d..280f8e9e2a8 100644
--- a/sql-plugin/src/main/scala/com/nvidia/spark/rapids/window/GpuWindowExpression.scala
+++ b/sql-plugin/src/main/scala/com/nvidia/spark/rapids/window/GpuWindowExpression.scala
@@ -28,7 +28,6 @@ import com.nvidia.spark.rapids.RapidsPluginImplicits._
 import com.nvidia.spark.rapids.shims.{GpuWindowUtil, ShimExpression}
 import scala.util.{Left, Right}
 
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.catalyst.analysis.TypeCheckResult
 import org.apache.spark.sql.catalyst.analysis.TypeCheckResult.{TypeCheckFailure, TypeCheckSuccess}
 import org.apache.spark.sql.catalyst.expressions._
@@ -1088,7 +1087,7 @@ class BatchedUnboundedToUnboundedBinaryFixer(val binOp: BinaryOp, val dataType:
  * right thing when they see a null.
  */
 class BatchedRunningWindowBinaryFixer(val binOp: BinaryOp, val name: String)
-    extends BatchedRunningWindowFixer with Logging {
+    extends BatchedRunningWindowFixer with RapidsLocalLog {
   private var previousResult: Option[Scalar] = None
 
   // checkpoint
@@ -1157,7 +1156,7 @@ class BatchedRunningWindowBinaryFixer(val binOp: BinaryOp, val name: String)
  * @param ignoreNulls Whether the function needs to ignore NULL values in the calculation.
  */
 abstract class FirstLastRunningWindowFixerBase(val name: String, val ignoreNulls: Boolean = false)
-  extends BatchedRunningWindowFixer with Logging {
+  extends BatchedRunningWindowFixer with RapidsLocalLog {
 
   /**
    * Saved "carry-over" result that might be applied to the next batch.
@@ -1365,7 +1364,7 @@ class LastRunningWindowFixer(ignoreNulls: Boolean = false)
  * might be able to make this more generic but we need to see what the use case really is.
  */
 class SumBinaryFixer(toType: DataType, isAnsi: Boolean)
-    extends BatchedRunningWindowFixer with Logging {
+    extends BatchedRunningWindowFixer with RapidsLocalLog {
   private val name = "sum"
   private var previousResult: Option[Scalar] = None
   private var previousOverflow: Option[Scalar] = None
@@ -1642,7 +1641,7 @@ class SumBinaryFixer(toType: DataType, isAnsi: Boolean)
  * happens in the `scanCombine` method for GpuRank.  It is a little ugly but it works to maintain
  * the requirement that the input to the fixer is a single column.
  */
-class RankFixer extends BatchedRunningWindowFixer with Logging {
+class RankFixer extends BatchedRunningWindowFixer with RapidsLocalLog {
   import RankFixer._
 
   // We have to look at row number as well as rank.  This fixer is the same one that `GpuRowNumber`
@@ -1769,7 +1768,7 @@ object RankFixer {
  * If anything is outside of a continues partition by group then we just keep
  * those values unchanged.
  */
-class DenseRankFixer extends BatchedRunningWindowFixer with Logging {
+class DenseRankFixer extends BatchedRunningWindowFixer with RapidsLocalLog {
   import DenseRankFixer._
 
   private var previousRank: Option[Scalar] = None
@@ -1942,11 +1941,11 @@ case class GpuRank(children: Seq[Expression]) extends GpuRunningWindowFunction
       isRunningBatched: Boolean): Seq[AggAndReplace[GroupByScanAggregation]] = {
     if (isRunningBatched) {
       // We are computing both rank and row number so we can fix it up at the end
-      Seq(AggAndReplace(GroupByScanAggregation.rank(), None),
-        AggAndReplace(GroupByScanAggregation.sum(), None))
+      Seq(new AggAndReplace(GroupByScanAggregation.rank(), None),
+        new AggAndReplace(GroupByScanAggregation.sum(), None))
     } else {
       // Not batched just do the rank
-      Seq(AggAndReplace(GroupByScanAggregation.rank(), None))
+      Seq(new AggAndReplace(GroupByScanAggregation.rank(), None))
     }
   }
 
@@ -1955,10 +1954,12 @@ case class GpuRank(children: Seq[Expression]) extends GpuRunningWindowFunction
   override def scanAggregation(isRunningBatched: Boolean): Seq[AggAndReplace[ScanAggregation]] = {
     if (isRunningBatched) {
       // We are computing both rank and row number so we can fix it up at the end
-      Seq(AggAndReplace(ScanAggregation.rank(), None), AggAndReplace(ScanAggregation.sum(), None))
+      Seq(
+        new AggAndReplace(ScanAggregation.rank(), None),
+        new AggAndReplace(ScanAggregation.sum(), None))
     } else {
       // Not batched just do the rank
-      Seq(AggAndReplace(ScanAggregation.rank(), None))
+      Seq(new AggAndReplace(ScanAggregation.rank(), None))
     }
   }
 
@@ -2007,13 +2008,13 @@ case class GpuDenseRank(children: Seq[Expression]) extends GpuRunningWindowFunct
 
   override def groupByScanAggregation(
       isRunningBatched: Boolean): Seq[AggAndReplace[GroupByScanAggregation]] =
-    Seq(AggAndReplace(GroupByScanAggregation.denseRank(), None))
+    Seq(new AggAndReplace(GroupByScanAggregation.denseRank(), None))
 
   override def scanInputProjection(isRunningBatched: Boolean): Seq[Expression] =
     groupByScanInputProjection(isRunningBatched)
 
   override def scanAggregation(isRunningBatched: Boolean): Seq[AggAndReplace[ScanAggregation]] =
-    Seq(AggAndReplace(ScanAggregation.denseRank(), None))
+    Seq(new AggAndReplace(ScanAggregation.denseRank(), None))
 
   override def newFixer(): BatchedRunningWindowFixer = new DenseRankFixer()
 }
@@ -2040,14 +2041,14 @@ case object GpuRowNumber extends GpuRunningWindowFunction
 
   override def groupByScanAggregation(
       isRunningBatched: Boolean): Seq[AggAndReplace[GroupByScanAggregation]] =
-    Seq(AggAndReplace(GroupByScanAggregation.sum(), None))
+    Seq(new AggAndReplace(GroupByScanAggregation.sum(), None))
 
   // For regular scans cudf does not support ROW_NUMBER, nor does it support COUNT_ALL
   // so we will do a SUM on a column of 1s
   override def scanInputProjection(isRunningBatched: Boolean): Seq[Expression] =
     groupByScanInputProjection(isRunningBatched)
   override def scanAggregation(isRunningBatched: Boolean): Seq[AggAndReplace[ScanAggregation]] =
-    Seq(AggAndReplace(ScanAggregation.sum(), None))
+    Seq(new AggAndReplace(ScanAggregation.sum(), None))
 
   override def scanCombine(isRunningBatched: Boolean, cols: Seq[ColumnVector]): ColumnVector = {
     cols.head.castTo(DType.INT32)
diff --git a/sql-plugin/src/main/scala/org/apache/spark/rapids/hybrid/CoalesceConvertIterator.scala b/sql-plugin/src/main/scala/org/apache/spark/rapids/hybrid/CoalesceConvertIterator.scala
index adfb2f6c58b..7136fa4c368 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/rapids/hybrid/CoalesceConvertIterator.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/rapids/hybrid/CoalesceConvertIterator.scala
@@ -22,7 +22,6 @@ import com.nvidia.spark.rapids.RapidsPluginImplicits._
 import com.nvidia.spark.rapids.hybrid.{CoalesceBatchConverter => NativeConverter, HybridHostRetryAllocator, RapidsHostColumn}
 
 import org.apache.spark.TaskContext
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.catalyst.expressions.Attribute
 import org.apache.spark.sql.types.StructType
 import org.apache.spark.sql.vectorized.{ColumnarBatch, ColumnVector}
@@ -36,7 +35,13 @@ class CoalesceConvertIterator(cpuScanIter: Iterator[ColumnarBatch],
                               targetBatchSizeInBytes: Long,
                               schema: StructType,
                               metrics: Map[String, GpuMetric])
-  extends Iterator[Array[RapidsHostColumn]] with Logging {
+  extends Iterator[Array[RapidsHostColumn]] {
+
+  @transient private lazy val log = org.slf4j.LoggerFactory.getLogger(
+    classOf[CoalesceConvertIterator])
+
+  private def logInfo(msg: => String): Unit = if (log.isInfoEnabled) log.info(msg)
+
 
   private var converterImpl: NativeConverter = _
 
@@ -140,7 +145,7 @@ class CoalesceConvertIterator(cpuScanIter: Iterator[ColumnarBatch],
   }
 }
 
-object CoalesceConvertIterator extends Logging {
+object CoalesceConvertIterator {
   /**
    * Consumes the RapidsHostBatchProducer and converts the HostColumnVectors to Device ones.
    */
diff --git a/sql-plugin/src/main/scala/org/apache/spark/rapids/hybrid/HybridExecutionUtils.scala b/sql-plugin/src/main/scala/org/apache/spark/rapids/hybrid/HybridExecutionUtils.scala
index c4bc1c73ff9..c653cf8e6b1 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/rapids/hybrid/HybridExecutionUtils.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/rapids/hybrid/HybridExecutionUtils.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2024-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2024-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -21,7 +21,6 @@ import java.util.Locale
 import ai.rapids.cudf.DType
 import com.nvidia.spark.rapids.{RapidsConf, VersionUtils}
 
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.catalyst.expressions._
 import org.apache.spark.sql.catalyst.plans.logical.{LogicalPlan, UnresolvedHint}
 import org.apache.spark.sql.catalyst.trees.TreePattern
@@ -33,7 +32,6 @@ import org.apache.spark.sql.rapids.execution.TrampolineUtil
 import org.apache.spark.sql.types._
 
 object HybridExecutionUtils extends PredicateHelper {
-  
   private val HYBRID_JAR_PLUGIN_CLASS_NAME = "com.nvidia.spark.rapids.hybrid.HybridPluginWrapper"
 
   /**
@@ -434,7 +432,7 @@ object HybridExecutionUtils extends PredicateHelper {
   }
 }
 
-object HybridExecOverrides extends Logging {
+object HybridExecOverrides {
   // The SQL hint enables HybridScan for specific tables even if HYBRID_PARQUET_READER is disabled
   val HYBRID_SCAN_HINT = "HYBRID_SCAN"
 
diff --git a/sql-plugin/src/main/scala/org/apache/spark/rapids/hybrid/RapidsHostBatchProducer.scala b/sql-plugin/src/main/scala/org/apache/spark/rapids/hybrid/RapidsHostBatchProducer.scala
index 3212d9bfe3d..0fb80cdb513 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/rapids/hybrid/RapidsHostBatchProducer.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/rapids/hybrid/RapidsHostBatchProducer.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2025, NVIDIA CORPORATION.
+ * Copyright (c) 2025-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -25,7 +25,6 @@ import com.nvidia.spark.rapids.hybrid.RapidsHostColumn
 import com.nvidia.spark.rapids.jni.RmmSpark
 
 import org.apache.spark.TaskContext
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.rapids.execution.TrampolineUtil
 
 /**
@@ -92,7 +91,15 @@ class PrefetchHostBatchProducer(
     taskAttId: Long,
     base: Iterator[Array[RapidsHostColumn]],
     capacity: Int,
-    waitTimeMetric: GpuMetric) extends RapidsHostBatchProducer with Logging {
+    waitTimeMetric: GpuMetric) extends RapidsHostBatchProducer {
+
+  @transient private lazy val log = org.slf4j.LoggerFactory.getLogger(
+    classOf[PrefetchHostBatchProducer])
+
+  private def logInfo(msg: => String): Unit = if (log.isInfoEnabled) log.info(msg)
+
+  private def logError(msg: => String): Unit = if (log.isErrorEnabled) log.error(msg)
+
 
   @volatile private var isInit: Boolean = false
   // Mark if there is in-progress element being produced in producerThread
diff --git a/sql-plugin/src/main/scala/org/apache/spark/shuffle/sort/io/RapidsLocalDiskShuffleExecutorComponents.scala b/sql-plugin/src/main/scala/org/apache/spark/shuffle/sort/io/RapidsLocalDiskShuffleExecutorComponents.scala
index e923d57ab83..af7f212bbd6 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/shuffle/sort/io/RapidsLocalDiskShuffleExecutorComponents.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/shuffle/sort/io/RapidsLocalDiskShuffleExecutorComponents.scala
@@ -21,7 +21,6 @@ import java.util.{Map => JMap, Optional}
 import com.google.common.annotations.VisibleForTesting
 
 import org.apache.spark.{SparkConf, SparkEnv}
-import org.apache.spark.internal.Logging
 import org.apache.spark.shuffle.IndexShuffleBlockResolver
 import org.apache.spark.shuffle.api.{ShuffleExecutorComponents, ShuffleMapOutputWriter, SingleSpillShuffleMapOutputWriter}
 import org.apache.spark.storage.BlockManager
@@ -31,7 +30,7 @@ import org.apache.spark.storage.BlockManager
  * instances with host memory buffer support.
  */
 class RapidsLocalDiskShuffleExecutorComponents(sparkConf: SparkConf)
-  extends ShuffleExecutorComponents with Logging {
+  extends ShuffleExecutorComponents {
 
   private var blockManager: BlockManager = null
   private var blockResolver: IndexShuffleBlockResolver = null
diff --git a/sql-plugin/src/main/scala/org/apache/spark/shuffle/sort/io/RapidsLocalDiskShuffleMapOutputWriter.scala b/sql-plugin/src/main/scala/org/apache/spark/shuffle/sort/io/RapidsLocalDiskShuffleMapOutputWriter.scala
index 3a0360d143c..1578d39b43d 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/shuffle/sort/io/RapidsLocalDiskShuffleMapOutputWriter.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/shuffle/sort/io/RapidsLocalDiskShuffleMapOutputWriter.scala
@@ -25,7 +25,6 @@ import com.nvidia.spark.rapids.{HostAlloc, RapidsConf}
 import com.nvidia.spark.rapids.spill.SpillablePartialFileHandle
 
 import org.apache.spark.SparkConf
-import org.apache.spark.internal.Logging
 import org.apache.spark.shuffle.IndexShuffleBlockResolver
 import org.apache.spark.shuffle.api.{ShuffleMapOutputWriter, ShufflePartitionWriter, WritableByteChannelWrapper}
 import org.apache.spark.shuffle.api.metadata.MapOutputCommitMessage
@@ -42,7 +41,17 @@ class RapidsLocalDiskShuffleMapOutputWriter(
     numPartitions: Int,
     blockResolver: IndexShuffleBlockResolver,
     sparkConf: SparkConf)
-  extends ShuffleMapOutputWriter with Logging {
+  extends ShuffleMapOutputWriter {
+  @transient private lazy val log = org.slf4j.LoggerFactory.getLogger(
+    classOf[RapidsLocalDiskShuffleMapOutputWriter])
+
+  private def logDebug(msg: => String): Unit = if (log.isDebugEnabled) log.debug(msg)
+
+  private def logWarning(msg: => String): Unit = if (log.isWarnEnabled) log.warn(msg)
+
+  private def logWarning(msg: => String, throwable: Throwable): Unit = {
+    if (log.isWarnEnabled) log.warn(msg, throwable)
+  }
 
   private val partitionLengths = new Array[Long](numPartitions)
   private var lastPartitionId = -1
diff --git a/sql-plugin/src/main/spark350/scala/org/apache/spark/sql/catalyst/GpuProjectingColumnarBatch.scala b/sql-plugin/src/main/scala/org/apache/spark/sql/catalyst/GpuProjectingColumnarBatch.scala
similarity index 71%
rename from sql-plugin/src/main/spark350/scala/org/apache/spark/sql/catalyst/GpuProjectingColumnarBatch.scala
rename to sql-plugin/src/main/scala/org/apache/spark/sql/catalyst/GpuProjectingColumnarBatch.scala
index 291a9ec5b06..7030857869a 100644
--- a/sql-plugin/src/main/spark350/scala/org/apache/spark/sql/catalyst/GpuProjectingColumnarBatch.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/sql/catalyst/GpuProjectingColumnarBatch.scala
@@ -13,23 +13,6 @@
  * See the License for the specific language governing permissions and
  * limitations under the License.
  */
-
-
-/*** spark-rapids-shim-json-lines
-{"spark": "350"}
-{"spark": "351"}
-{"spark": "352"}
-{"spark": "353"}
-{"spark": "354"}
-{"spark": "355"}
-{"spark": "356"}
-{"spark": "357"}
-{"spark": "358"}
-{"spark": "400"}
-{"spark": "401"}
-{"spark": "402"}
-{"spark": "411"}
-spark-rapids-shim-json-lines ***/
 package org.apache.spark.sql.catalyst
 
 import com.nvidia.spark.rapids.Arm.closeOnExcept
@@ -43,9 +26,9 @@ case class GpuProjectingColumnarBatch(schema: StructType, colOrdinals: Seq[Int])
 
   /**
    * Project a subset of columns from a `ColumnarBatch` onto a new batch
-   * based on the specified column ordinals and output schema. 
+   * based on the specified column ordinals and output schema.
    *
-   * @param batch The input batch to project. It's caller's responsibility to close batch.
+   * @param batch The input batch to project. It is the caller's responsibility to close the batch.
    * @return The projected batch.
    */
   def project(batch: ColumnarBatch): ColumnarBatch = {
@@ -60,7 +43,26 @@ case class GpuProjectingColumnarBatch(schema: StructType, colOrdinals: Seq[Int])
 }
 
 object GpuProjectingColumnarBatch {
-  def apply(cpu: ProjectingInternalRow): GpuProjectingColumnarBatch = {
-    GpuProjectingColumnarBatch(cpu.schema, cpu.colOrdinals)
+  /**
+   * Builds the GPU projection from the CPU-side projecting row.
+   *
+   * `cpu` is read reflectively through its public no-arg `schema` and `colOrdinals`
+   * methods, so it is typed as `AnyRef` instead of `ProjectingInternalRow`.
+   */
+  def apply(cpu: AnyRef): GpuProjectingColumnarBatch = {
+    GpuProjectingColumnarBatch(
+      invokeNoArg(cpu, "schema").asInstanceOf[StructType],
+      invokeNoArg(cpu, "colOrdinals").asInstanceOf[Seq[Int]])
+  }
+
+  // Calls a public no-arg method by name. Method.invoke wraps anything the target throws
+  // in InvocationTargetException, so rethrow the cause to surface the original failure.
+  private def invokeNoArg(target: AnyRef, methodName: String): AnyRef = {
+    try {
+      target.getClass.getMethod(methodName).invoke(target)
+    } catch {
+      case e: java.lang.reflect.InvocationTargetException if e.getCause != null =>
+        throw e.getCause
+    }
   }
 }
diff --git a/sql-plugin/src/main/scala/org/apache/spark/sql/catalyst/json/rapids/GpuJsonScan.scala b/sql-plugin/src/main/scala/org/apache/spark/sql/catalyst/json/rapids/GpuJsonScan.scala
index 9e367679891..25bff7901ab 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/sql/catalyst/json/rapids/GpuJsonScan.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/sql/catalyst/json/rapids/GpuJsonScan.scala
@@ -268,7 +268,7 @@ case class GpuJsonScan(
     val broadcastedConf = sparkSession.sparkContext.broadcast(
       new SerializableConfiguration(hadoopConf))
 
-    GpuJsonPartitionReaderFactory(sparkSession.sessionState.conf, broadcastedConf,
+    new GpuJsonPartitionReaderFactory(sparkSession.sessionState.conf, broadcastedConf,
       dataSchema, readDataSchema, readPartitionSchema, parsedOptions, maxReaderBatchSizeRows,
       maxReaderBatchSizeBytes, maxGpuColumnSizeBytes, metrics, options.asScala.toMap)
   }
@@ -276,7 +276,7 @@ case class GpuJsonScan(
   override def withInputFile(): GpuScan = this
 }
 
-case class GpuJsonPartitionReaderFactory(
+class GpuJsonPartitionReaderFactory(
     sqlConf: SQLConf,
     broadcastedConf: Broadcast[SerializableConfiguration],
     dataSchema: StructType,
@@ -288,7 +288,8 @@ case class GpuJsonPartitionReaderFactory(
     maxReaderBatchSizeBytes: Long,
     maxGpuColumnSizeBytes: Long,
     metrics: Map[String, GpuMetric],
-    @transient params: Map[String, String]) extends ShimFilePartitionReaderFactory(params) {
+    @transient params: Map[String, String])
+  extends ShimFilePartitionReaderFactory(params) with Serializable {
 
   override def buildReader(partitionedFile: PartitionedFile): PartitionReader[InternalRow] = {
     throw new IllegalStateException("ROW BASED PARSING IS NOT SUPPORTED ON THE GPU...")
diff --git a/sql-plugin/src/main/scala/org/apache/spark/sql/catalyst/json/rapids/GpuReadJsonFileFormat.scala b/sql-plugin/src/main/scala/org/apache/spark/sql/catalyst/json/rapids/GpuReadJsonFileFormat.scala
index 3a80180b154..bb5fcee97a3 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/sql/catalyst/json/rapids/GpuReadJsonFileFormat.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/sql/catalyst/json/rapids/GpuReadJsonFileFormat.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2022-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2022-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -56,7 +56,7 @@ class GpuReadJsonFileFormat extends JsonFileFormat with GpuReadFileFormatWithMet
       sparkSession.sessionState.conf.sessionLocalTimeZone,
       sparkSession.sessionState.conf.columnNameOfCorruptRecord)
     val rapidsConf = new RapidsConf(sqlConf)
-    val factory = GpuJsonPartitionReaderFactory(
+    val factory = new GpuJsonPartitionReaderFactory(
       sqlConf,
       broadcastedHadoopConf,
       dataSchema,
@@ -81,7 +81,7 @@ class GpuReadJsonFileFormat extends JsonFileFormat with GpuReadFileFormatWithMet
   }
 }
 
-object GpuReadJsonFileFormat {
+object GpuReadJsonFileFormat extends Serializable {
   def tagSupport(meta: SparkPlanMeta[FileSourceScanExec]): Unit = {
     val fsse = meta.wrapped
     GpuJsonScan.tagSupport(
diff --git a/sql-plugin/src/main/scala/org/apache/spark/sql/hive/rapids/GpuHiveFileFormat.scala b/sql-plugin/src/main/scala/org/apache/spark/sql/hive/rapids/GpuHiveFileFormat.scala
index 0861f36b064..7a99acb6770 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/sql/hive/rapids/GpuHiveFileFormat.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/sql/hive/rapids/GpuHiveFileFormat.scala
@@ -27,7 +27,6 @@ import com.nvidia.spark.rapids.jni.fileio.RapidsFileIO
 import com.nvidia.spark.rapids.shims.BucketingUtilsShim
 import org.apache.hadoop.mapreduce.{Job, TaskAttemptContext}
 
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.SparkSession
 import org.apache.spark.sql.execution.datasources.parquet.ParquetOptions
 import org.apache.spark.sql.hive.rapids.shims.GpuInsertIntoHiveTableMeta
@@ -36,7 +35,7 @@ import org.apache.spark.sql.rapids.execution.TrampolineUtil
 import org.apache.spark.sql.types.{DataType, Decimal, DecimalType, StringType, StructType}
 import org.apache.spark.sql.vectorized.ColumnarBatch
 
-object GpuHiveFileFormat extends Logging {
+object GpuHiveFileFormat {
   private val parquetOutputFormatClass =
     "org.apache.hadoop.hive.ql.io.parquet.MapredParquetOutputFormat"
   private val parquetSerdeClass =
@@ -199,7 +198,7 @@ object GpuHiveFileFormat extends Logging {
 }
 
 class GpuHiveParquetFileFormat(compType: CompressionType) extends ColumnarFileFormat
-    with Logging with Serializable {
+    with Serializable with RapidsLocalLog {
 
   override def prepareWrite(sparkSession: SparkSession, job: Job,
       options: Map[String, String], dataSchema: StructType): ColumnarOutputWriterFactory = {
@@ -264,7 +263,7 @@ class GpuHiveParquetWriter(override val path: String, dataSchema: StructType,
 
 }
 
-class GpuHiveTextFileFormat extends ColumnarFileFormat with Logging with Serializable {
+class GpuHiveTextFileFormat extends ColumnarFileFormat with Serializable {
 
   override def supportDataType(dataType: DataType): Boolean =
     GpuHiveTextFileUtils.isSupportedType(dataType)
diff --git a/sql-plugin/src/main/scala/org/apache/spark/sql/hive/rapids/GpuHiveTableScanExec.scala b/sql-plugin/src/main/scala/org/apache/spark/sql/hive/rapids/GpuHiveTableScanExec.scala
index e806790cdb2..359b111db6f 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/sql/hive/rapids/GpuHiveTableScanExec.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/sql/hive/rapids/GpuHiveTableScanExec.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2022-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2022-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -90,6 +90,8 @@ case class GpuHiveTableScanExec(requestedAttributes: Seq[Attribute],
 
   val partitionAttributes: Seq[AttributeReference] = hiveTableRelation.partitionCols
 
+  private def shimSparkSession: SparkSession = sparkSession.asInstanceOf[SparkSession]
+
   // CPU expression to prune Hive partitions, based on [[partitionPruningPredicate]].
   // Bind all partition key attribute references in the partition pruning predicate for later
   // evaluation.
@@ -140,7 +142,7 @@ case class GpuHiveTableScanExec(requestedAttributes: Seq[Attribute],
         prunePartitions(hivePartitions)
       }
     } else {
-      if (sparkSession.sessionState.conf.metastorePartitionPruning &&
+      if (shimSparkSession.sessionState.conf.metastorePartitionPruning &&
         partitionPruningPredicate.nonEmpty) {
         rawPartitions
       } else {
@@ -152,16 +154,16 @@ case class GpuHiveTableScanExec(requestedAttributes: Seq[Attribute],
   // exposed for tests
   @transient lazy val rawPartitions: Seq[HivePartition] = {
     val prunedPartitions =
-      if (sparkSession.sessionState.conf.metastorePartitionPruning &&
+      if (shimSparkSession.sessionState.conf.metastorePartitionPruning &&
         partitionPruningPredicate.nonEmpty) {
         // Retrieve the original attributes based on expression ID so that capitalization matches.
         val normalizedFilters = partitionPruningPredicate.map(_.transform {
           case a: AttributeReference => originalAttributes(a)
         })
-        sparkSession.sessionState.catalog
+        shimSparkSession.sessionState.catalog
           .listPartitionsByFilter(hiveTableRelation.tableMeta.identifier, normalizedFilters)
       } else {
-        sparkSession.sessionState.catalog.listPartitions(hiveTableRelation.tableMeta.identifier)
+        shimSparkSession.sessionState.catalog.listPartitions(hiveTableRelation.tableMeta.identifier)
       }
     prunedPartitions.map(HiveClientImpl.toHivePartition(_, hiveQlTable))
   }
@@ -202,7 +204,7 @@ case class GpuHiveTableScanExec(requestedAttributes: Seq[Attribute],
                           readSchema: StructType,
                           options: Map[String, String]
               ): PartitionedFile => Iterator[InternalRow] = {
-    val readerFactory = GpuHiveTextPartitionReaderFactory(
+    val readerFactory = new GpuHiveTextPartitionReaderFactory(
       sqlConf = sqlConf,
       broadcastConf = broadcastConf,
       inputFileSchema = dataSchema,
@@ -329,13 +331,13 @@ case class GpuHiveTableScanExec(requestedAttributes: Seq[Attribute],
     // Assume Delimited text.
     val options                   = hiveTableRelation.tableMeta.properties ++
                                     hiveTableRelation.tableMeta.storage.properties
-    val hadoopConf                = sparkSession.sessionState.newHadoopConf()
+    val hadoopConf                = shimSparkSession.sessionState.newHadoopConf()
     // In the CPU HiveTableScanExec the config will have a bunch of confs set for S3 keys
     // and predicate push down/etc. We don't need this because we are getting that information
     // directly.
-    val broadcastHadoopConf       = sparkSession.sparkContext.broadcast(
+    val broadcastHadoopConf       = shimSparkSession.sparkContext.broadcast(
                                       new SerializableConfiguration(hadoopConf))
-    val sqlConf                   = sparkSession.sessionState.conf
+    val sqlConf                   = shimSparkSession.sessionState.conf
     val rapidsConf                = new RapidsConf(sqlConf)
     val requestedOutputDataSchema = getRequestedOutputDataSchema(hiveTableRelation.tableMeta.schema,
                                                                  partitionAttributes,
@@ -349,10 +351,10 @@ case class GpuHiveTableScanExec(requestedAttributes: Seq[Attribute],
                                                 options)
     val rdd = if (hiveTableRelation.isPartitioned) {
       createReadRDDForPartitions(reader, hiveTableRelation, requestedOutputDataSchema,
-                                 sparkSession, hadoopConf)
+                                 shimSparkSession, hadoopConf)
     } else {
       createReadRDDForTable(reader, hiveTableRelation, requestedOutputDataSchema,
-                            sparkSession, hadoopConf)
+                            shimSparkSession, hadoopConf)
     }
     sendDriverMetrics()
     rdd
@@ -439,18 +441,19 @@ class AlphabeticallyReorderingColumnPartitionReader(fileReader: PartitionReader[
 }
 
 // Factory to build the columnar reader.
-case class GpuHiveTextPartitionReaderFactory(sqlConf: SQLConf,
-                                             broadcastConf: Broadcast[SerializableConfiguration],
-                                             inputFileSchema: StructType,
-                                             partitionSchema: StructType,
-                                             requestedOutputDataSchema: StructType,
-                                             requestedAttributes: Seq[Attribute],
-                                             maxReaderBatchSizeRows: Integer,
-                                             maxReaderBatchSizeBytes: Long,
-                                             maxGpuColumnSizeBytes: Long,
-                                             metrics: Map[String, GpuMetric],
-                                             params: Map[String, String])
-  extends ShimFilePartitionReaderFactory(params) {
+class GpuHiveTextPartitionReaderFactory(
+    val sqlConf: SQLConf,
+    val broadcastConf: Broadcast[SerializableConfiguration],
+    val inputFileSchema: StructType,
+    val partitionSchema: StructType,
+    val requestedOutputDataSchema: StructType,
+    val requestedAttributes: Seq[Attribute],
+    val maxReaderBatchSizeRows: Integer,
+    val maxReaderBatchSizeBytes: Long,
+    val maxGpuColumnSizeBytes: Long,
+    val metrics: Map[String, GpuMetric],
+    val params: Map[String, String])
+  extends ShimFilePartitionReaderFactory(params) with Serializable {
 
   override def buildReader(partitionedFile: PartitionedFile): PartitionReader[InternalRow] = {
     throw new IllegalStateException("Row-based text parsing is not supported on GPU.")
diff --git a/sql-plugin/src/main/scala/org/apache/spark/sql/hive/rapids/HiveProviderImpl.scala b/sql-plugin/src/main/scala/org/apache/spark/sql/hive/rapids/HiveProviderImpl.scala
index 50f731c5fa0..f468fb7dcc7 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/sql/hive/rapids/HiveProviderImpl.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/sql/hive/rapids/HiveProviderImpl.scala
@@ -48,7 +48,7 @@ class HiveProviderImpl extends HiveProviderCmdShims {
         ExprChecks.projectOnly(
           udfTypeSig,
           TypeSig.all,
-          repeatingParamCheck = Some(RepeatingParamCheck("param", udfTypeSig, TypeSig.all))),
+          repeatingParamCheck = Some(new RepeatingParamCheck("param", udfTypeSig, TypeSig.all))),
         (a, conf, p, r) => new ExprMeta[HiveSimpleUDF](a, conf, p, r) {
 
           val function = createFunction(a)
@@ -91,7 +91,7 @@ class HiveProviderImpl extends HiveProviderCmdShims {
         ExprChecks.projectOnly(
           udfTypeSig,
           TypeSig.all,
-          repeatingParamCheck = Some(RepeatingParamCheck("param", udfTypeSig, TypeSig.all))),
+          repeatingParamCheck = Some(new RepeatingParamCheck("param", udfTypeSig, TypeSig.all))),
         (a, conf, p, r) => new ExprMeta[HiveGenericUDF](a, conf, p, r) {
           val function = createFunction(a)
           private val opRapidsFunc = function match {
diff --git a/sql-plugin/src/main/scala/org/apache/spark/sql/nvidia/DFUDFShims.scala b/sql-plugin/src/main/scala/org/apache/spark/sql/nvidia/DFUDFShims.scala
new file mode 100644
index 00000000000..6270819dfe2
--- /dev/null
+++ b/sql-plugin/src/main/scala/org/apache/spark/sql/nvidia/DFUDFShims.scala
@@ -0,0 +1,101 @@
+/*
+ * Copyright (c) 2024-2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.spark.sql.nvidia
+
+import java.lang.reflect.{InvocationTargetException, Method}
+
+import org.apache.spark.sql.Column
+import org.apache.spark.sql.catalyst.expressions.Expression
+
+/**
+ * Reflection-based conversions between `Column` and Catalyst `Expression`.
+ *
+ * The helper objects under `org.apache.spark.sql.classic` are used when they can be loaded;
+ * otherwise the conversions fall back to `Column.expr` and `Column.apply(Expression)`.
+ * Every lookup is lazy, so only the members on the path actually taken are resolved.
+ */
+object DFUDFShims {
+  private[this] lazy val classicColumnNodeConverter: Option[AnyRef] =
+    moduleFor("org.apache.spark.sql.classic.ColumnNodeToExpressionConverter$")
+
+  private[this] lazy val classicExpressionUtils: Option[AnyRef] =
+    moduleFor("org.apache.spark.sql.classic.ExpressionUtils$")
+
+  private[this] lazy val columnNodeMethod: Method =
+    classOf[Column].getMethod("node")
+
+  private[this] lazy val classicColumnNodeApplyMethod: Method =
+    classicColumnNodeConverter.get.getClass.getMethod("apply", columnNodeMethod.getReturnType)
+
+  private[this] lazy val classicExpressionColumnMethod: Method =
+    classicExpressionUtils.get.getClass.getMethod("column", classOf[Expression])
+
+  private[this] lazy val columnExprMethod: Method =
+    classOf[Column].getMethod("expr")
+
+  private[this] lazy val columnModule: AnyRef =
+    moduleFor("org.apache.spark.sql.Column$").get
+
+  private[this] lazy val columnApplyMethod: Method =
+    columnModule.getClass.getMethod("apply", classOf[Expression])
+
+  /** Converts a `Column` into the Catalyst `Expression` it represents. */
+  def columnToExpr(c: Column): Expression = {
+    classicColumnNodeConverter match {
+      case Some(converter) =>
+        val node = invoke(columnNodeMethod, c)
+        invoke(classicColumnNodeApplyMethod, converter, node).asInstanceOf[Expression]
+      case None =>
+        invoke(columnExprMethod, c).asInstanceOf[Expression]
+    }
+  }
+
+  /** Wraps a Catalyst `Expression` in a `Column`. */
+  def exprToColumn(e: Expression): Column = {
+    classicExpressionUtils match {
+      case Some(expressionUtils) =>
+        invoke(classicExpressionColumnMethod, expressionUtils, e).asInstanceOf[Column]
+      case None =>
+        invoke(columnApplyMethod, columnModule, e).asInstanceOf[Column]
+    }
+  }
+
+  /**
+   * Calls `method` on `target`, rethrowing the callee's own exception rather than the
+   * `InvocationTargetException` that `Method.invoke` wraps it in, so callers observe the
+   * same failure a direct call would raise.
+   */
+  private def invoke(method: Method, target: AnyRef, args: AnyRef*): AnyRef = {
+    try {
+      method.invoke(target, args: _*)
+    } catch {
+      case e: InvocationTargetException if e.getCause != null => throw e.getCause
+    }
+  }
+
+  /**
+   * Returns the singleton instance of the Scala object compiled to `className`, or `None`
+   * when that class cannot be found.
+   */
+  private def moduleFor(className: String): Option[AnyRef] = {
+    try {
+      Some(Class.forName(className).getField("MODULE" + "$").get(null).asInstanceOf[AnyRef])
+    } catch {
+      case _: ClassNotFoundException => None
+    }
+  }
+}
diff --git a/sql-plugin/src/main/scala/org/apache/spark/sql/nvidia/LogicalPlanRules.scala b/sql-plugin/src/main/scala/org/apache/spark/sql/nvidia/LogicalPlanRules.scala
index 923d92572b5..e621b72b5e8 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/sql/nvidia/LogicalPlanRules.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/sql/nvidia/LogicalPlanRules.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2024, NVIDIA CORPORATION.
+ * Copyright (c) 2024-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -16,26 +16,65 @@
 
 package org.apache.spark.sql.nvidia
 
-import com.nvidia.spark.rapids.RapidsConf
-
-import org.apache.spark.internal.Logging
+import org.apache.spark.sql.Column
 import org.apache.spark.sql.catalyst.expressions.{Expression, ScalaUDF}
 import org.apache.spark.sql.catalyst.plans.logical.LogicalPlan
 import org.apache.spark.sql.catalyst.rules.Rule
+import org.apache.spark.sql.internal.SQLConf
+
+object LogicalPlanRules {
+  private val dfUDFEnabledKey = "spark.rapids.sql.dfudf.enabled"
+
+  // Parses a boolean conf value; a malformed value is reported together with its key.
+  private def toBoolean(value: String, key: String): Boolean =
+    try value.trim.toBoolean catch {
+      case _: IllegalArgumentException =>
+        throw new IllegalArgumentException(s"$key should be boolean, but was $value")
+    }
+
+  // The feature counts as enabled when the key is not set.
+  private def isDFUDFEnabled(conf: SQLConf): Boolean =
+    Option(conf.getConfString(dfUDFEnabledKey, null)).forall(toBoolean(_, dfUDFEnabledKey))
+
+  // DFUDFShims is resolved by name at runtime rather than referenced statically.
+  @transient private[this] lazy val dfUDFShimsModule =
+    Class.forName("org.apache.spark.sql.nvidia.DFUDFShims" + "$")
+      .getField("MODULE" + "$").get(null)
+
+  @transient private[this] lazy val exprToColumnMethod =
+    dfUDFShimsModule.getClass.getMethod("exprToColumn", classOf[Expression])
+  @transient private[this] lazy val columnToExprMethod =
+    dfUDFShimsModule.getClass.getMethod("columnToExpr", classOf[Column])
+
+  // Method.invoke wraps callee failures; strip the wrappers so callers see the real error.
+  private def invokeShim(method: java.lang.reflect.Method, arg: AnyRef): AnyRef =
+    try method.invoke(dfUDFShimsModule, arg) catch {
+      case e: java.lang.reflect.InvocationTargetException =>
+        var t: Throwable = e
+        while (t.getClass == e.getClass && t.getCause != null) t = t.getCause
+        throw t
+    }
+
+  private def exprToColumn(expr: Expression): Column =
+    invokeShim(exprToColumnMethod, expr).asInstanceOf[Column]
+
+  private def columnToExpr(column: Column): Expression =
+    invokeShim(columnToExprMethod, column).asInstanceOf[Expression]
+}
 
-case class LogicalPlanRules() extends Rule[LogicalPlan] with Logging {
+case class LogicalPlanRules() extends Rule[LogicalPlan] {
   val replacePartialFunc: PartialFunction[Expression, Expression] = {
     case f: ScalaUDF if DFUDF.getDFUDF(f.function).isDefined =>
       DFUDF.getDFUDF(f.function).map {
-        dfudf => DFUDFShims.columnToExpr(
-          dfudf(f.children.map(DFUDFShims.exprToColumn(_)).toArray))
+        dfudf => LogicalPlanRules.columnToExpr(
+          dfudf(f.children.map(LogicalPlanRules.exprToColumn(_)).toArray))
       }.getOrElse{
         throw new IllegalStateException("Inconsistent results when extracting df_udf")
       }
   }
 
   override def apply(plan: LogicalPlan): LogicalPlan = {
-    if (RapidsConf.DFUDF_ENABLED.get(plan.conf)) {
+    if (LogicalPlanRules.isDFUDFEnabled(plan.conf)) {
       plan.transformExpressions(replacePartialFunc)
     } else {
       plan
diff --git a/sql-plugin/src/main/scala/org/apache/spark/sql/nvidia/dataframe_udfs.scala b/sql-plugin/src/main/scala/org/apache/spark/sql/nvidia/dataframe_udfs.scala
index 79f71ba4ca0..e5187b2a300 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/sql/nvidia/dataframe_udfs.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/sql/nvidia/dataframe_udfs.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2024, NVIDIA CORPORATION.
+ * Copyright (c) 2024-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -26,7 +26,7 @@ trait DFUDF {
   def apply(input: Array[Column]): Column
 }
 
-case class DFUDF0(f: Function0[Column])
+class DFUDF0(val f: Function0[Column])
   extends UDF0[Any] with DFUDF {
   override def call(): Any = {
     throw new IllegalStateException("TODO better error message. This should have been replaced")
@@ -38,7 +38,7 @@ case class DFUDF0(f: Function0[Column])
   }
 }
 
-case class DFUDF1(f: Function1[Column, Column])
+class DFUDF1(val f: Function1[Column, Column])
   extends UDF1[Any, Any] with DFUDF {
   override def call(t1: Any): Any = {
     throw new IllegalStateException("TODO better error message. This should have been replaced")
@@ -50,7 +50,7 @@ case class DFUDF1(f: Function1[Column, Column])
   }
 }
 
-case class DFUDF2(f: Function2[Column, Column, Column])
+class DFUDF2(val f: Function2[Column, Column, Column])
   extends UDF2[Any, Any, Any] with DFUDF {
   override def call(t1: Any, t2: Any): Any = {
     throw new IllegalStateException("TODO better error message. This should have been replaced")
@@ -62,7 +62,7 @@ case class DFUDF2(f: Function2[Column, Column, Column])
   }
 }
 
-case class DFUDF3(f: Function3[Column, Column, Column, Column])
+class DFUDF3(val f: Function3[Column, Column, Column, Column])
   extends UDF3[Any, Any, Any, Any] with DFUDF {
   override def call(t1: Any, t2: Any, t3: Any): Any = {
     throw new IllegalStateException("TODO better error message. This should have been replaced")
@@ -74,7 +74,7 @@ case class DFUDF3(f: Function3[Column, Column, Column, Column])
   }
 }
 
-case class DFUDF4(f: Function4[Column, Column, Column, Column, Column])
+class DFUDF4(val f: Function4[Column, Column, Column, Column, Column])
   extends UDF4[Any, Any, Any, Any, Any] with DFUDF {
   override def call(t1: Any, t2: Any, t3: Any, t4: Any): Any = {
     throw new IllegalStateException("TODO better error message. This should have been replaced")
@@ -86,7 +86,7 @@ case class DFUDF4(f: Function4[Column, Column, Column, Column, Column])
   }
 }
 
-case class DFUDF5(f: Function5[Column, Column, Column, Column, Column, Column])
+class DFUDF5(val f: Function5[Column, Column, Column, Column, Column, Column])
   extends UDF5[Any, Any, Any, Any, Any, Any] with DFUDF {
   override def call(t1: Any, t2: Any, t3: Any, t4: Any, t5: Any): Any = {
     throw new IllegalStateException("TODO better error message. This should have been replaced")
@@ -98,7 +98,7 @@ case class DFUDF5(f: Function5[Column, Column, Column, Column, Column, Column])
   }
 }
 
-case class DFUDF6(f: Function6[Column, Column, Column, Column, Column, Column, Column])
+class DFUDF6(val f: Function6[Column, Column, Column, Column, Column, Column, Column])
   extends UDF6[Any, Any, Any, Any, Any, Any, Any] with DFUDF {
   override def call(t1: Any, t2: Any, t3: Any, t4: Any, t5: Any, t6: Any): Any = {
     throw new IllegalStateException("TODO better error message. This should have been replaced")
@@ -110,7 +110,7 @@ case class DFUDF6(f: Function6[Column, Column, Column, Column, Column, Column, C
   }
 }
 
-case class DFUDF7(f: Function7[Column, Column, Column, Column, Column, Column, Column, Column])
+class DFUDF7(val f: Function7[Column, Column, Column, Column, Column, Column, Column, Column])
   extends UDF7[Any, Any, Any, Any, Any, Any, Any, Any] with DFUDF {
   override def call(t1: Any, t2: Any, t3: Any, t4: Any, t5: Any, t6: Any, t7: Any): Any = {
     throw new IllegalStateException("TODO better error message. This should have been replaced")
@@ -122,7 +122,7 @@ case class DFUDF7(f: Function7[Column, Column, Column, Column, Column, Column, C
   }
 }
 
-case class DFUDF8(f: Function8[Column, Column, Column, Column, Column, Column, Column, Column,
+class DFUDF8(val f: Function8[Column, Column, Column, Column, Column, Column, Column, Column,
   Column])
   extends UDF8[Any, Any, Any, Any, Any, Any, Any, Any, Any] with DFUDF {
   override def call(t1: Any, t2: Any, t3: Any, t4: Any, t5: Any, t6: Any, t7: Any, t8: Any): Any = {
@@ -135,7 +135,7 @@ case class DFUDF8(f: Function8[Column, Column, Column, Column, Column, Column, C
   }
 }
 
-case class DFUDF9(f: Function9[Column, Column, Column, Column, Column, Column, Column, Column,
+class DFUDF9(val f: Function9[Column, Column, Column, Column, Column, Column, Column, Column,
   Column, Column])
   extends UDF9[Any, Any, Any, Any, Any, Any, Any, Any, Any, Any] with DFUDF {
   override def call(t1: Any, t2: Any, t3: Any, t4: Any, t5: Any, t6: Any, t7: Any, t8: Any,
@@ -149,7 +149,7 @@ case class DFUDF9(f: Function9[Column, Column, Column, Column, Column, Column, C
   }
 }
 
-case class DFUDF10(f: Function10[Column, Column, Column, Column, Column, Column, Column, Column,
+class DFUDF10(val f: Function10[Column, Column, Column, Column, Column, Column, Column, Column,
   Column, Column, Column])
   extends UDF10[Any, Any, Any, Any, Any, Any, Any, Any, Any, Any, Any] with DFUDF {
   override def call(t1: Any, t2: Any, t3: Any, t4: Any, t5: Any, t6: Any, t7: Any, t8: Any,
@@ -164,7 +164,7 @@ case class DFUDF10(f: Function10[Column, Column, Column, Column, Column, Column,
   }
 }
 
-case class JDFUDF0(f: UDF0[Column])
+class JDFUDF0(val f: UDF0[Column])
   extends UDF0[Any] with DFUDF {
   override def call(): Any = {
     throw new IllegalStateException("TODO better error message. This should have been replaced")
@@ -176,7 +176,7 @@ case class JDFUDF0(f: UDF0[Column])
   }
 }
 
-case class JDFUDF1(f: UDF1[Column, Column])
+class JDFUDF1(val f: UDF1[Column, Column])
   extends UDF1[Any, Any] with DFUDF {
   override def call(t1: Any): Any = {
     throw new IllegalStateException("TODO better error message. This should have been replaced")
@@ -188,7 +188,7 @@ case class JDFUDF1(f: UDF1[Column, Column])
   }
 }
 
-case class JDFUDF2(f: UDF2[Column, Column, Column])
+class JDFUDF2(val f: UDF2[Column, Column, Column])
   extends UDF2[Any, Any, Any] with DFUDF {
   override def call(t1: Any, t2: Any): Any = {
     throw new IllegalStateException("TODO better error message. This should have been replaced")
@@ -200,7 +200,7 @@ case class JDFUDF2(f: UDF2[Column, Column, Column])
   }
 }
 
-case class JDFUDF3(f: UDF3[Column, Column, Column, Column])
+class JDFUDF3(val f: UDF3[Column, Column, Column, Column])
   extends UDF3[Any, Any, Any, Any] with DFUDF {
   override def call(t1: Any, t2: Any, t3: Any): Any = {
     throw new IllegalStateException("TODO better error message. This should have been replaced")
@@ -212,7 +212,7 @@ case class JDFUDF3(f: UDF3[Column, Column, Column, Column])
   }
 }
 
-case class JDFUDF4(f: UDF4[Column, Column, Column, Column, Column])
+class JDFUDF4(val f: UDF4[Column, Column, Column, Column, Column])
   extends UDF4[Any, Any, Any, Any, Any] with DFUDF {
   override def call(t1: Any, t2: Any, t3: Any, t4: Any): Any = {
     throw new IllegalStateException("TODO better error message. This should have been replaced")
@@ -224,7 +224,7 @@ case class JDFUDF4(f: UDF4[Column, Column, Column, Column, Column])
   }
 }
 
-case class JDFUDF5(f: UDF5[Column, Column, Column, Column, Column, Column])
+class JDFUDF5(val f: UDF5[Column, Column, Column, Column, Column, Column])
   extends UDF5[Any, Any, Any, Any, Any, Any] with DFUDF {
   override def call(t1: Any, t2: Any, t3: Any, t4: Any, t5: Any): Any = {
     throw new IllegalStateException("TODO better error message. This should have been replaced")
@@ -236,7 +236,7 @@ case class JDFUDF5(f: UDF5[Column, Column, Column, Column, Column, Column])
   }
 }
 
-case class JDFUDF6(f: UDF6[Column, Column, Column, Column, Column, Column, Column])
+class JDFUDF6(val f: UDF6[Column, Column, Column, Column, Column, Column, Column])
   extends UDF6[Any, Any, Any, Any, Any, Any, Any] with DFUDF {
   override def call(t1: Any, t2: Any, t3: Any, t4: Any, t5: Any, t6: Any): Any = {
     throw new IllegalStateException("TODO better error message. This should have been replaced")
@@ -248,7 +248,7 @@ case class JDFUDF6(f: UDF6[Column, Column, Column, Column, Column, Column, Colum
   }
 }
 
-case class JDFUDF7(f: UDF7[Column, Column, Column, Column, Column, Column, Column, Column])
+class JDFUDF7(val f: UDF7[Column, Column, Column, Column, Column, Column, Column, Column])
   extends UDF7[Any, Any, Any, Any, Any, Any, Any, Any] with DFUDF {
   override def call(t1: Any, t2: Any, t3: Any, t4: Any, t5: Any, t6: Any, t7: Any): Any = {
     throw new IllegalStateException("TODO better error message. This should have been replaced")
@@ -260,7 +260,7 @@ case class JDFUDF7(f: UDF7[Column, Column, Column, Column, Column, Column, Colum
   }
 }
 
-case class JDFUDF8(f: UDF8[Column, Column, Column, Column, Column, Column, Column, Column,
+class JDFUDF8(val f: UDF8[Column, Column, Column, Column, Column, Column, Column, Column,
   Column])
   extends UDF8[Any, Any, Any, Any, Any, Any, Any, Any, Any] with DFUDF {
   override def call(t1: Any, t2: Any, t3: Any, t4: Any, t5: Any, t6: Any, t7: Any, t8: Any): Any = {
@@ -273,7 +273,7 @@ case class JDFUDF8(f: UDF8[Column, Column, Column, Column, Column, Column, Colum
   }
 }
 
-case class JDFUDF9(f: UDF9[Column, Column, Column, Column, Column, Column, Column, Column,
+class JDFUDF9(val f: UDF9[Column, Column, Column, Column, Column, Column, Column, Column,
   Column, Column])
   extends UDF9[Any, Any, Any, Any, Any, Any, Any, Any, Any, Any] with DFUDF {
   override def call(t1: Any, t2: Any, t3: Any, t4: Any, t5: Any, t6: Any, t7: Any, t8: Any,
@@ -287,7 +287,7 @@ case class JDFUDF9(f: UDF9[Column, Column, Column, Column, Column, Column, Colum
   }
 }
 
-case class JDFUDF10(f: UDF10[Column, Column, Column, Column, Column, Column, Column, Column,
+class JDFUDF10(val f: UDF10[Column, Column, Column, Column, Column, Column, Column, Column,
   Column, Column, Column])
   extends UDF10[Any, Any, Any, Any, Any, Any, Any, Any, Any, Any, Any] with DFUDF {
   override def call(t1: Any, t2: Any, t3: Any, t4: Any, t5: Any, t6: Any, t7: Any, t8: Any,
diff --git a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/AvroProviderImpl.scala b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/AvroProviderImpl.scala
index ff9ebaaff68..ac235f9310d 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/AvroProviderImpl.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/AvroProviderImpl.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2022-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2022-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -61,7 +61,7 @@ class AvroProviderImpl extends AvroProvider {
       pushedFilters: Array[Filter],
       fileScan: GpuFileSourceScanExec): PartitionReaderFactory = {
     val poolConfBuilder = ThreadPoolConfBuilder(fileScan.rapidsConf)
-    GpuAvroMultiFilePartitionReaderFactory(
+    new GpuAvroMultiFilePartitionReaderFactory(
       fileScan.relation.sparkSession.sessionState.conf,
       fileScan.rapidsConf,
       broadcastedConf,
diff --git a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/BasicColumnarWriteStatsTracker.scala b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/BasicColumnarWriteStatsTracker.scala
index 85707aad5fc..142d1df9e7a 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/BasicColumnarWriteStatsTracker.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/BasicColumnarWriteStatsTracker.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2019-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2019-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -26,7 +26,6 @@ import org.apache.hadoop.conf.Configuration
 import org.apache.hadoop.fs.{FileSystem, Path}
 
 import org.apache.spark.{SparkContext, TaskContext}
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.catalyst.InternalRow
 import org.apache.spark.sql.execution.SQLExecution
 import org.apache.spark.sql.execution.datasources.WriteTaskStats
@@ -35,19 +34,6 @@ import org.apache.spark.sql.rapids.BasicColumnarWriteJobStatsTracker._
 import org.apache.spark.sql.vectorized.ColumnarBatch
 import org.apache.spark.util.SerializableConfiguration
 
-/**
- * Simple metrics collected during an instance of [[GpuFileFormatDataWriter]].
- * These were first introduced in https://github.com/apache/spark/pull/18159 (SPARK-20703).
- */
-case class BasicColumnarWriteTaskStats(
-    partitions: Seq[InternalRow],
-    numFiles: Int,
-    numWriters: Int,
-    numBytes: Long,
-    numRows: Long)
-    extends WriteTaskStats
-
-
 /**
  * Simple metrics collected during an instance of [[GpuFileFormatDataWriter]].
  * This is the columnar version of
@@ -56,7 +42,20 @@ case class BasicColumnarWriteTaskStats(
 class BasicColumnarWriteTaskStatsTracker(
     hadoopConf: Configuration,
     taskCommitTimeMetric: Option[GpuMetric])
-    extends ColumnarWriteTaskStatsTracker with Logging {
+    extends ColumnarWriteTaskStatsTracker {
+
+  // SLF4J logger for this tracker; each helper below takes its message by name so the
+  // string is only built when the corresponding level is enabled.
+  private val log = org.slf4j.LoggerFactory.getLogger(classOf[BasicColumnarWriteTaskStatsTracker])
+
+  private def logInfo(msg: => String): Unit = if (log.isInfoEnabled) { log.info(msg) }
+  private def logWarning(msg: => String): Unit = if (log.isWarnEnabled) { log.warn(msg) }
+  private def logDebug(msg: => String): Unit = if (log.isDebugEnabled) { log.debug(msg) }
+
+  // Debug variant that also records the throwable.
+  private def logDebug(msg: => String, throwable: Throwable): Unit =
+    if (log.isDebugEnabled) { log.debug(msg, throwable) }
+
   private[this] val partitions: mutable.ArrayBuffer[InternalRow] = mutable.ArrayBuffer.empty
   private[this] var numFiles: Int = 0
   private[this] var numSubmittedFiles: Int = 0
@@ -186,7 +185,7 @@ class BasicColumnarWriteTaskStatsTracker(
         "or files being not immediately visible in the filesystem.")
     }
     taskCommitTimeMetric.foreach(_ += taskCommitTime)
-    BasicColumnarWriteTaskStats(partitions.toSeq, numFiles, maxNumWriters, numBytes, numRows)
+    new BasicColumnarWriteTaskStats(partitions.toSeq, numFiles, maxNumWriters, numBytes, numRows)
   }
 }
 
diff --git a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/BridgeGenerateUnsafeProjection.scala b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/BridgeGenerateUnsafeProjection.scala
index fbdc197ce80..ea64ccb4b71 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/BridgeGenerateUnsafeProjection.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/BridgeGenerateUnsafeProjection.scala
@@ -16,6 +16,8 @@
 
 package org.apache.spark.sql.rapids
 
+import scala.util.control.NonFatal
+
 import com.nvidia.spark.rapids.RapidsHostColumnBuilder
 
 import org.apache.spark.sql.catalyst.InternalRow
@@ -65,17 +67,48 @@ class InterpretedBridgeUnsafeProjection(expressions: Seq[Expression])
 /**
  * The factory object for `UnsafeProjection`.
  */
-object BridgeUnsafeProjection
-  extends CodeGeneratorWithInterpretedFallback[Seq[Expression], BridgeUnsafeProjection] {
+object BridgeUnsafeProjection {
+
+  /** Looks up the optimized append function via `BridgeUnsafeProjectionCodegen`. */
+  def createOptimizedAppendFunction(dataType: DataType,
+      nullable: Boolean): (Any, RapidsHostColumnBuilder) => Unit =
+    BridgeUnsafeProjectionCodegen.createOptimizedAppendFunction(dataType, nullable)
+
+  /** Projection over the data types of `schema`'s fields, in order. */
+  def create(schema: StructType): BridgeUnsafeProjection = create(schema.fields.map(_.dataType))
+
+  /** Projection where ordinal `i` is read as `fields(i)` through a nullable reference. */
+  def create(fields: Array[DataType]): BridgeUnsafeProjection =
+    create(fields.zipWithIndex.map { case (dt, ordinal) => BoundReference(ordinal, dt, true) })
+
+  def create(exprs: Seq[Expression]): BridgeUnsafeProjection =
+    BridgeUnsafeProjectionCodegen.create(exprs)
+
+  def create(expr: Expression): BridgeUnsafeProjection = create(Seq(expr))
+
+  /** Binds `exprs` against `inputSchema` first, then builds the projection. */
+  def create(exprs: Seq[Expression], inputSchema: Seq[Attribute]): BridgeUnsafeProjection =
+    create(bindReferences(exprs, inputSchema))
+}
+
+private object BridgeUnsafeProjectionCodegen {
+  // Strip the object's trailing `$` so the logger is named the way Spark's Logging would.
+  private[this] val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+
+  // Prefer codegen; on any non-fatal failure, warn and use the interpreted projection.
+  // NOTE(review): spark.sql.codegen.factoryMode is not consulted here - confirm intended.
+  private def createObject(in: Seq[Expression]): BridgeUnsafeProjection =
+    try createCodeGeneratedObject(in) catch {
+      case NonFatal(e) =>
+        log.warn("Expr codegen error and falling back to interpreter mode", e)
+        createInterpretedObject(in)
+    }
 
-  override protected def createCodeGeneratedObject(in: Seq[Expression]): BridgeUnsafeProjection = {
-    // Just call generate directly - let any exceptions propagate naturally
-    // The CodeGeneratorWithInterpretedFallback base class will catch exceptions 
-    // and fall back to createInterpretedObject
+  private def createCodeGeneratedObject(in: Seq[Expression]): BridgeUnsafeProjection = {
     BridgeGenerateUnsafeProjection.generate(in, SQLConf.get.subexpressionEliminationEnabled)
   }
 
-  override protected def createInterpretedObject(in: Seq[Expression]): BridgeUnsafeProjection = {
+  private def createInterpretedObject(in: Seq[Expression]): BridgeUnsafeProjection = {
     new InterpretedBridgeUnsafeProjection(in)
   }
 
@@ -238,8 +271,8 @@ object BridgeUnsafeProjection
  *
  * @note The returned UnsafeRow will be pointed to a scratch buffer inside the projection.
  */
-object BridgeGenerateUnsafeProjection extends
-  CodeGenerator[Seq[Expression], BridgeUnsafeProjection] {
+object BridgeGenerateUnsafeProjection {
+  private val codegenLog = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
 
   case class Schema(dataType: DataType, nullable: Boolean)
 
@@ -547,6 +580,18 @@ object BridgeGenerateUnsafeProjection extends
   protected def bind(in: Seq[Expression], inputSchema: Seq[Attribute]): Seq[Expression] =
     bindReferences(in, inputSchema)
 
+  /** Returns a fresh `CodegenContext`. */
+  def newCodeGenContext(): CodegenContext = new CodegenContext
+
+  /** Canonicalizes `expressions` and passes the result to `create`. */
+  def generate(expressions: Seq[Expression]): BridgeUnsafeProjection =
+    create(canonicalize(expressions))
+
+  /** Binds `expressions` against `inputSchema`, then generates from the bound form. */
+  def generate(
+      expressions: Seq[Expression], inputSchema: Seq[Attribute]): BridgeUnsafeProjection =
+    generate(bind(expressions, inputSchema))
+
   def generate(
       expressions: Seq[Expression],
       subexpressionEliminationEnabled: Boolean): BridgeUnsafeProjection = {
@@ -640,7 +685,9 @@ object BridgeGenerateUnsafeProjection extends
 
     val code = CodeFormatter.stripOverlappingComments(
       new CodeAndComment(codeBody, ctx.getPlaceHolderToComments()))
-    logDebug(s"code for ${expressions.mkString(",")}:\n${CodeFormatter.format(code)}")
+    if (codegenLog.isDebugEnabled) {
+      codegenLog.debug(s"code for ${expressions.mkString(",")}:\n${CodeFormatter.format(code)}")
+    }
 
     val (clazz, _) = CodeGenerator.compile(code)
     clazz.generate(ctx.references.toArray).asInstanceOf[BridgeUnsafeProjection]
diff --git a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/ExternalSource.scala b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/ExternalSource.scala
index cae457272e8..11d6baa6691 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/ExternalSource.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/ExternalSource.scala
@@ -23,7 +23,6 @@ import com.nvidia.spark.rapids._
 import com.nvidia.spark.rapids.delta.DeltaProvider
 import com.nvidia.spark.rapids.iceberg.IcebergProvider
 
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.catalyst.expressions.Expression
 import org.apache.spark.sql.catalyst.expressions.objects.StaticInvoke
 import org.apache.spark.sql.connector.catalog.SupportsWrite
@@ -40,7 +39,11 @@ import org.apache.spark.util.Utils
  * spark-avro classes because `class not found` exception may throw if spark-avro does not
  * exist at runtime. Details see: https://github.com/NVIDIA/spark-rapids/issues/5648
  */
-trait ExternalSourceBase extends Logging {
+trait ExternalSourceBase {
+  // Trait-local SLF4J logger; `msg` below is by-name, so it is only built when WARN is on.
+  @transient private lazy val log = org.slf4j.LoggerFactory.getLogger(classOf[ExternalSourceBase])
+  private def logWarning(msg: => String): Unit = if (log.isWarnEnabled) log.warn(msg)
+
   val avroScanClassName = "org.apache.spark.sql.v2.avro.AvroScan"
   lazy val hasSparkAvroJar = {
     /** spark-avro is an optional package for Spark, so the RAPIDS Accelerator
diff --git a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/GpuAvroScan.scala b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/GpuAvroScan.scala
index a86120a7fad..ccf8c14242b 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/GpuAvroScan.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/GpuAvroScan.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2022-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2022-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -40,7 +40,6 @@ import org.apache.hadoop.fs.{FSDataInputStream, Path}
 
 import org.apache.spark.TaskContext
 import org.apache.spark.broadcast.Broadcast
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.SparkSession
 import org.apache.spark.sql.avro.{AvroOptions, SchemaConverters}
 import org.apache.spark.sql.catalyst.InternalRow
@@ -119,12 +118,12 @@ case class GpuAvroScan(
     // The partition values are already truncated in `FileScan.partitions`.
     // We should use `readPartitionSchema` as the partition schema here.
     if (rapidsConf.isAvroPerFileReadEnabled) {
-      GpuAvroPartitionReaderFactory(sparkSession.sessionState.conf, rapidsConf, broadcastedConf,
+      new GpuAvroPartitionReaderFactory(sparkSession.sessionState.conf, rapidsConf, broadcastedConf,
         dataSchema, readDataSchema, readPartitionSchema, parsedOptions, metrics,
         options.asScala.toMap)
     } else {
       val poolConfBuilder = ThreadPoolConfBuilder(rapidsConf)
-      GpuAvroMultiFilePartitionReaderFactory(sparkSession.sessionState.conf,
+      new GpuAvroMultiFilePartitionReaderFactory(sparkSession.sessionState.conf,
         rapidsConf, broadcastedConf, dataSchema, readDataSchema, readPartitionSchema,
         parsedOptions, metrics, pushedFilters, poolConfBuilder, queryUsesInputFile)
     }
@@ -152,7 +151,7 @@ case class GpuAvroScan(
 }
 
 /** Avro partition reader factory to build columnar reader */
-case class GpuAvroPartitionReaderFactory(
+class GpuAvroPartitionReaderFactory(
     @transient sqlConf: SQLConf,
     @transient rapidsConf: RapidsConf,
     broadcastedConf: Broadcast[SerializableConfiguration],
@@ -162,7 +161,7 @@ case class GpuAvroPartitionReaderFactory(
     avroOptions: AvroOptions,
     metrics: Map[String, GpuMetric],
     @transient params: Map[String, String])
-  extends ShimFilePartitionReaderFactory(params) with Logging {
+  extends ShimFilePartitionReaderFactory(params) with RapidsLocalLog with Serializable {
 
   private val debugDumpPrefix = rapidsConf.avroDebugDumpPrefix
   private val debugDumpAlways = rapidsConf.avroDebugDumpAlways
@@ -179,7 +178,7 @@ case class GpuAvroPartitionReaderFactory(
   override def buildColumnarReader(partFile: PartitionedFile): PartitionReader[ColumnarBatch] = {
     val conf = broadcastedConf.value.value
     val startTime = System.nanoTime()
-    val blockMeta = AvroFileFilterHandler(conf, avroOptions).filterBlocks(partFile)
+    val blockMeta = new AvroFileFilterHandler(conf, avroOptions).filterBlocks(partFile)
     metrics.get(FILTER_TIME).foreach {
       _ += (System.nanoTime() - startTime)
     }
@@ -194,7 +193,7 @@ case class GpuAvroPartitionReaderFactory(
 /**
  * The multi-file partition reader factory for cloud or coalescing reading of avro file format.
  */
-case class GpuAvroMultiFilePartitionReaderFactory(
+class GpuAvroMultiFilePartitionReaderFactory(
     @transient sqlConf: SQLConf,
     @transient rapidsConf: RapidsConf,
     broadcastedConf: Broadcast[SerializableConfiguration],
@@ -206,7 +205,8 @@ case class GpuAvroMultiFilePartitionReaderFactory(
     filters: Array[Filter],
     poolConfBuilder: ThreadPoolConfBuilder,
     queryUsesInputFile: Boolean)
-  extends MultiFilePartitionReaderFactoryBase(sqlConf, broadcastedConf, rapidsConf) {
+  extends MultiFilePartitionReaderFactoryBase(sqlConf, broadcastedConf, rapidsConf)
+      with Serializable {
 
   private val debugDumpPrefix = rapidsConf.avroDebugDumpPrefix
   private val debugDumpAlways = rapidsConf.avroDebugDumpAlways
@@ -269,7 +269,7 @@ case class GpuAvroMultiFilePartitionReaderFactory(
       conf: Configuration): PartitionReader[ColumnarBatch] = {
     val clippedBlocks = ArrayBuffer[AvroSingleDataBlockInfo]()
     val mapPathHeader = LinkedHashMap[Path, Header]()
-    val filterHandler = AvroFileFilterHandler(conf, options)
+    val filterHandler = new AvroFileFilterHandler(conf, options)
 
     metrics.getOrElse(FILTER_TIME, NoopMetric).ns {
       metrics.getOrElse(SCAN_TIME, NoopMetric).ns {
@@ -279,23 +279,23 @@ case class GpuAvroMultiFilePartitionReaderFactory(
           } catch {
             case e: FileNotFoundException if ignoreMissingFiles =>
               logWarning(s"Skipped missing file: ${file.filePath}", e)
-              AvroBlockMeta(null, 0L, Seq.empty)
+              new AvroBlockMeta(null, 0L, Seq.empty)
             // Throw FileNotFoundException even if `ignoreCorruptFiles` is true
             case e: FileNotFoundException if !ignoreMissingFiles => throw e
             case e@(_: RuntimeException | _: IOException) if ignoreCorruptFiles =>
               logWarning(
                 s"Skipped the rest of the content in the corrupted file: ${file.filePath}", e)
-              AvroBlockMeta(null, 0L, Seq.empty)
+              new AvroBlockMeta(null, 0L, Seq.empty)
           }
           val fPath = new Path(new URI(file.filePath.toString()))
           clippedBlocks ++= singleFileInfo.blocks.map(block =>
-            AvroSingleDataBlockInfo(
+            new AvroSingleDataBlockInfo(
               fPath,
-              AvroDataBlock(block),
+              new AvroDataBlock(block),
               file.partitionValues,
-              AvroSchemaWrapper(SchemaConverters.toAvroType(readDataSchema)),
+              new AvroSchemaWrapper(SchemaConverters.toAvroType(readDataSchema)),
               readDataSchema,
-              AvroExtraInfo()))
+              new AvroExtraInfo()))
           if (singleFileInfo.blocks.nonEmpty) {
             // No need to check the header since it can not be null when blocks is not empty here.
             mapPathHeader.put(fPath, singleFileInfo.header)
@@ -312,7 +312,7 @@ case class GpuAvroMultiFilePartitionReaderFactory(
 }
 
 /** A trait collecting common methods across the 3 kinds of avro readers */
-trait GpuAvroReaderBase extends Logging { self: FilePartitionReaderBase =>
+trait GpuAvroReaderBase extends RapidsLocalLog { self: FilePartitionReaderBase =>
   def debugDumpPrefix: Option[String]
 
   def debugDumpAlways: Boolean
@@ -452,7 +452,7 @@ trait GpuAvroReaderBase extends Logging { self: FilePartitionReaderBase =>
       withResource(partFilePath.getFileSystem(conf).open(partFilePath)) { in =>
         closeOnExcept(HostMemoryBuffer.allocate(estOutSize)) { hmb =>
           withResource(new HostMemoryOutputStream(hmb)) { out =>
-            val headerAndBlocks = BlockInfo(0, headerSize, 0, 0) +: blocks
+            val headerAndBlocks = new BlockInfo(0, headerSize, 0, 0) +: blocks
             copyBlocksData(headerAndBlocks, in, out)
             // check we didn't go over memory
             if (out.getPos > estOutSize) {
@@ -487,7 +487,7 @@ trait GpuAvroReaderBase extends Logging { self: FilePartitionReaderBase =>
       // Copy every block without the tailing sync marker if a sync is given. This
       // is for coalescing reader who requires to append this given sync marker
       // to each block. Then we can not merge sequential blocks.
-      blocks.map(b => CopyRange(b.blockStart, b.blockSize - SYNC_SIZE))
+      blocks.map(b => new CopyRange(b.blockStart, b.blockSize - SYNC_SIZE))
     }.getOrElse(computeCopyRanges(blocks))
 
     val copySyncFunc: OutputStream => Unit = if (sync.isEmpty) {
@@ -535,7 +535,7 @@ trait GpuAvroReaderBase extends Logging { self: FilePartitionReaderBase =>
     blocks.foreach { block =>
       if (currentCopyEnd != block.blockStart) {
         if (currentCopyEnd != 0) {
-          copyRanges.append(CopyRange(currentCopyStart, currentCopyEnd - currentCopyStart))
+          copyRanges.append(new CopyRange(currentCopyStart, currentCopyEnd - currentCopyStart))
         }
         currentCopyStart = block.blockStart
         currentCopyEnd = currentCopyStart
@@ -544,7 +544,7 @@ trait GpuAvroReaderBase extends Logging { self: FilePartitionReaderBase =>
     }
 
     if (currentCopyEnd != currentCopyStart) {
-      copyRanges.append(CopyRange(currentCopyStart, currentCopyEnd - currentCopyStart))
+      copyRanges.append(new CopyRange(currentCopyStart, currentCopyEnd - currentCopyStart))
     }
     copyRanges.toSeq
   }
@@ -696,7 +696,8 @@ class GpuMultiFileCloudAvroPartitionReader(
       closeOnExcept(batchIter) { _ =>
         if (bufsAndSizes.length > 1) {
           val updatedBuffers = bufsAndSizes.drop(1)
-          currentFileHostBuffers = Some(buffer.copy(memBuffersAndSizes = updatedBuffers))
+          currentFileHostBuffers = Some(new AvroHostBuffersWithMeta(
+            buffer.partitionedFile, updatedBuffers, buffer.bytesRead))
         } else {
           currentFileHostBuffers = None
         }
@@ -717,7 +718,7 @@ class GpuMultiFileCloudAvroPartitionReader(
     new ReadBatchRunner(tc, file, config, filters)
 
   /** Two utils classes */
-  private case class AvroHostBuffersWithMeta(
+  private class AvroHostBuffersWithMeta(
     override val partitionedFile: PartitionedFile,
     override val memBuffersAndSizes: Array[SingleHMBAndMeta],
     override val bytesRead: Long) extends HostMemoryBuffersWithMetaDataBase
@@ -726,7 +727,7 @@ class GpuMultiFileCloudAvroPartitionReader(
       taskContext: TaskContext,
       partFile: PartitionedFile,
       config: Configuration,
-      filters: Array[Filter]) extends UnboundedAsyncRunner[BufferInfo] with Logging {
+      filters: Array[Filter]) extends UnboundedAsyncRunner[BufferInfo] with RapidsLocalLog {
 
     override def callImpl(): BufferInfo = {
       TrampolineUtil.setTaskContext(taskContext)
@@ -737,13 +738,13 @@ class GpuMultiFileCloudAvroPartitionReader(
       } catch {
         case e: FileNotFoundException if ignoreMissingFiles =>
           logWarning(s"Skipped missing file: ${partFile.filePath}", e)
-          AvroHostBuffersWithMeta(partFile, Array(SingleHMBAndMeta.empty()), 0)
+          new AvroHostBuffersWithMeta(partFile, Array(SingleHMBAndMeta.empty()), 0)
         // Throw FileNotFoundException even if `ignoreCorruptFiles` is true
         case e: FileNotFoundException if !ignoreMissingFiles => throw e
         case e @(_: RuntimeException | _: IOException) if ignoreCorruptFiles =>
           logWarning(
             s"Skipped the rest of the content in the corrupted file: ${partFile.filePath}", e)
-          AvroHostBuffersWithMeta(partFile, Array(SingleHMBAndMeta.empty()), 0)
+          new AvroHostBuffersWithMeta(partFile, Array(SingleHMBAndMeta.empty()), 0)
       } finally {
         RmmSpark.poolThreadFinishedForTask(taskContext.taskAttemptId())
         TrampolineUtil.unsetTaskContext()
@@ -754,7 +755,7 @@ class GpuMultiFileCloudAvroPartitionReader(
         arrayBufSize: Array[SingleHMBAndMeta],
         startingBytesRead: Long): HostMemoryBuffersWithMetaDataBase = {
       val bytesRead = fileSystemBytesRead() - startingBytesRead
-      AvroHostBuffersWithMeta(partFile, arrayBufSize, bytesRead)
+      new AvroHostBuffersWithMeta(partFile, arrayBufSize, bytesRead)
     }
 
     private val stopPosition = partFile.start + partFile.length
@@ -944,7 +945,7 @@ class GpuMultiFileAvroPartitionReader(
     // in 'checkIfNeedToSplitDataBlock'
     val mergedHeader = Header.mergeMetadata(headers.toSeq)
     assert(mergedHeader.nonEmpty, "No header exists")
-    AvroBatchContext(chunkedBlocks, clippedSchema, mergedHeader.get)
+    new AvroBatchContext(chunkedBlocks, clippedSchema, mergedHeader.get)
   }
 
   override def calculateEstimatedBlocksOutputSize(batchContext: BatchContext): Long = {
@@ -1044,7 +1045,7 @@ class GpuMultiFileAvroPartitionReader(
     blocks.map(toBlockInfo(_))
 
   implicit def toBlockBases(blocks: Seq[BlockInfo]): Seq[DataBlockBase] =
-    blocks.map(AvroDataBlock(_))
+    blocks.map(new AvroDataBlock(_))
 
   implicit def toAvroExtraInfo(in: ExtraInfo): AvroExtraInfo =
     in.asInstanceOf[AvroExtraInfo]
@@ -1055,9 +1056,9 @@ class GpuMultiFileAvroPartitionReader(
 }
 
 /** A tool to filter Avro blocks */
-case class AvroFileFilterHandler(
+class AvroFileFilterHandler(
     hadoopConf: Configuration,
-    @transient options: AvroOptions) extends Logging {
+    options: AvroOptions) extends RapidsLocalLog with Serializable {
 
   @scala.annotation.nowarn(
     "msg=value ignoreExtension in class AvroOptions is deprecated*"
@@ -1071,10 +1072,10 @@ case class AvroFileFilterHandler(
         // Get blocks only belong to this split
         reader.sync(partFile.start)
         val partBlocks = reader.getPartialBlocks(partFile.start + partFile.length)
-        AvroBlockMeta(reader.header, reader.headerSize, partBlocks)
+        new AvroBlockMeta(reader.header, reader.headerSize, partBlocks)
       }
     } else {
-      AvroBlockMeta(null, 0L, Seq.empty)
+      new AvroBlockMeta(null, 0L, Seq.empty)
     }
   }
 }
@@ -1085,7 +1086,8 @@ case class AvroFileFilterHandler(
  * @param header the header of avro file
  * @param blocks the total block info of avro file
  */
-case class AvroBlockMeta(header: Header, headerSize: Long, blocks: Seq[BlockInfo])
+class AvroBlockMeta(val header: Header, val headerSize: Long, val blocks: Seq[BlockInfo])
+  extends Serializable
 
 /**
  * CopyRange to indicate from where to copy.
@@ -1093,32 +1095,32 @@ case class AvroBlockMeta(header: Header, headerSize: Long, blocks: Seq[BlockInfo
  * @param offset from where to copy
  * @param length how many bytes to copy
  */
-private case class CopyRange(offset: Long, length: Long)
+private class CopyRange(val offset: Long, val length: Long)
 
 /** Extra information */
-case class AvroExtraInfo() extends ExtraInfo
+class AvroExtraInfo extends ExtraInfo with Serializable
 
 /** avro schema wrapper */
-case class AvroSchemaWrapper(schema: Schema) extends SchemaBase {
+class AvroSchemaWrapper(val schema: Schema) extends SchemaBase with Serializable {
   override def isEmpty: Boolean = schema.getFields.isEmpty
 }
 
 /** avro BlockInfo wrapper */
-case class AvroDataBlock(blockInfo: BlockInfo) extends DataBlockBase {
+class AvroDataBlock(val blockInfo: BlockInfo) extends DataBlockBase with Serializable {
   override def getRowCount: Long = blockInfo.count
   override def getReadDataSize: Long = blockInfo.dataSize
   override def getBlockSize: Long = blockInfo.blockSize
 }
 
-case class AvroSingleDataBlockInfo(
-  filePath: Path,
-  dataBlock: AvroDataBlock,
-  partitionValues: InternalRow,
-  schema: AvroSchemaWrapper,
-  readSchema: StructType,
-  extraInfo: AvroExtraInfo) extends SingleDataBlockInfo
+class AvroSingleDataBlockInfo(
+  val filePath: Path,
+  val dataBlock: AvroDataBlock,
+  val partitionValues: InternalRow,
+  val schema: AvroSchemaWrapper,
+  val readSchema: StructType,
+  val extraInfo: AvroExtraInfo) extends SingleDataBlockInfo with Serializable
 
-case class AvroBatchContext(
+class AvroBatchContext(
   override val origChunkedBlocks: LinkedHashMap[Path, ArrayBuffer[DataBlockBase]],
   override val schema: SchemaBase,
-  mergedHeader: Header) extends BatchContext(origChunkedBlocks, schema)
+  val mergedHeader: Header) extends BatchContext(origChunkedBlocks, schema) with Serializable
diff --git a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/GpuDataSourceBase.scala b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/GpuDataSourceBase.scala
index 4c90da533c9..4c8b502ddc4 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/GpuDataSourceBase.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/GpuDataSourceBase.scala
@@ -21,7 +21,7 @@ import java.util.{Locale, ServiceConfigurationError, ServiceLoader}
 
 import scala.util.{Failure, Success, Try}
 
-import com.nvidia.spark.rapids.GpuParquetFileFormat
+import com.nvidia.spark.rapids.{GpuParquetFileFormat, RapidsLocalLog}
 import com.nvidia.spark.rapids.shims.SparkShimImpl
 import org.apache.commons.lang3.reflect.ConstructorUtils
 import org.apache.hadoop.conf.Configuration
@@ -29,7 +29,6 @@ import org.apache.hadoop.fs.Path
 
 import org.apache.spark.SparkException
 import org.apache.spark.deploy.SparkHadoopUtil
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql._
 import org.apache.spark.sql.catalyst.catalog.{BucketSpec, CatalogTable}
 import org.apache.spark.sql.catalyst.util.CaseInsensitiveMap
@@ -62,7 +61,7 @@ abstract class GpuDataSourceBase(
     bucketSpec: Option[BucketSpec] = None,
     options: Map[String, String] = Map.empty,
     catalogTable: Option[CatalogTable] = None,
-    origProvider: Class[_]) extends Logging {
+    origProvider: Class[_]) extends RapidsLocalLog {
 
   protected def originalProvidingInstance() = origProvider.getConstructor().newInstance()
 
@@ -311,7 +310,7 @@ abstract class GpuDataSourceBase(
   }
 }
 
-object GpuDataSourceBase extends Logging {
+object GpuDataSourceBase extends RapidsLocalLog {
 
   /** A map to maintain backward compatibility in case we move data sources around. */
   private val backwardCompatibilityMap: Map[String, String] = {
diff --git a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/GpuFileFormatDataWriter.scala b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/GpuFileFormatDataWriter.scala
index 4365bc109a3..f0c0a4de66b 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/GpuFileFormatDataWriter.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/GpuFileFormatDataWriter.scala
@@ -27,11 +27,11 @@ import com.nvidia.spark.rapids.Arm.{closeOnExcept, withResource}
 import com.nvidia.spark.rapids.RapidsPluginImplicits._
 import com.nvidia.spark.rapids.RmmRapidsRetryIterator.withRetryNoSplit
 import com.nvidia.spark.rapids.fileio.hadoop.HadoopFileIO
+import com.nvidia.spark.rapids.fileio.hadoop.PerfIOHadoopInputFileFactory
 import com.nvidia.spark.rapids.shims.GpuFileFormatDataWriterShim
 import org.apache.hadoop.fs.Path
 import org.apache.hadoop.mapreduce.TaskAttemptContext
 
-import org.apache.spark.internal.Logging
 import org.apache.spark.internal.io.FileCommitProtocol
 import org.apache.spark.sql.catalyst.InternalRow
 import org.apache.spark.sql.catalyst.catalog.{BucketSpec, ExternalCatalogUtils}
@@ -348,12 +348,12 @@ class GpuDynamicPartitionDataSingleWriter(
   }
 
   /**
-   * A case class to hold the batch, the optional partition values and the optional bucket
+   * A class to hold the batch, the optional partition values and the optional bucket
    * ID for a split group. All the rows in the batch belong to the group defined by the
    * partition values and the bucket ID.
    */
-  private case class SplitPack(split: SpillableColumnarBatch, partValues: Option[InternalRow],
-      bucketId: Option[Int]) extends AutoCloseable {
+  private class SplitPack(val split: SpillableColumnarBatch, val partValues: Option[InternalRow],
+      val bucketId: Option[Int]) extends AutoCloseable {
     override def close(): Unit = {
       split.safeClose()
     }
@@ -546,7 +546,7 @@ class GpuDynamicPartitionDataSingleWriter(
           val split = splits(idx)
           splits(idx) = null
           closeOnExcept(split) { _ =>
-            SplitPack(
+            new SplitPack(
               SpillableColumnarBatch(split, outDataTypes,
                 SpillPriorities.ACTIVE_BATCHING_PRIORITY),
               getNextPartValues(idx), getBucketId(idx))
@@ -673,7 +673,10 @@ class GpuDynamicPartitionDataSingleWriter(
     // The input batch that is entirely sorted, so split it up by partitions and (or)
     // bucket ids, and write the split batches one by one.
     withResource(splitBatchByKeyAndClose(batch)) { splitPacks =>
-      splitPacks.zipWithIndex.foreach { case (SplitPack(sp, partVals, bucketId), i) =>
+      splitPacks.zipWithIndex.foreach { case (pack, i) =>
+        val sp = pack.split
+        val partVals = pack.partValues
+        val bucketId = pack.bucketId
         val hasDiffPart = partVals != currentWriterId.partitionValues
         val hasDiffBucket = bucketId != currentWriterId.bucketId
         if (hasDiffPart || hasDiffBucket) {
@@ -719,7 +722,7 @@ class GpuDynamicPartitionDataConcurrentWriter(
     debugOutputBasePath: Option[String])
   extends GpuDynamicPartitionDataSingleWriter(description, taskAttemptContext,
     committer, debugOutputBasePath)
-  with Logging {
+  with RapidsLocalLog {
 
   /** Wrapper class for status and caches of a unique concurrent output writer. */
   private class WriterStatusWithBatches extends WriterAndStatus with AutoCloseable {
@@ -784,7 +787,7 @@ class GpuDynamicPartitionDataConcurrentWriter(
           (tt.sortTime, tt.sortOpTime)
         }.getOrElse((NoopMetric, NoopMetric))
 
-      val sortIter = GpuOutOfCoreSortIterator(pendingCbsIter ++ iterator,
+      val sortIter = new GpuOutOfCoreSortIterator(pendingCbsIter ++ iterator,
         new GpuSorter(spec.sortOrder, spec.output, Map.empty[String, GpuMetric]),
         GpuSortExec.targetSize(spec.batchSize),
         sortOpTime, sortMetric, NoopMetric, NoopMetric)
@@ -975,9 +978,9 @@ class GpuDynamicPartitionDataConcurrentWriter(
  * @param bucketIdExpression Expression to calculate bucket id based on bucket column(s).
  * @param bucketFileNamePrefix Prefix of output file name based on bucket id.
  */
-case class GpuWriterBucketSpec(
-  bucketIdExpression: GpuExpression,
-  bucketFileNamePrefix: Int => String)
+class GpuWriterBucketSpec(
+  val bucketIdExpression: GpuExpression,
+  val bucketFileNamePrefix: Int => String) extends Serializable
 
 /**
  * A shared job description for all the GPU write tasks.
@@ -999,7 +1002,9 @@ class GpuWriteJobDescription(
     val concurrentWriterPartitionFlushSize: Long)
   extends Serializable {
 
-  lazy val fileIO: HadoopFileIO = new HadoopFileIO(serializableHadoopConf.value)
+  // Built on first access from the job's Hadoop configuration and the shared factory instance.
+  lazy val fileIO: HadoopFileIO =
+    new HadoopFileIO(serializableHadoopConf.value, PerfIOHadoopInputFileFactory.INSTANCE)
 
   assert(AttributeSet(allColumns) == AttributeSet(partitionColumns ++ dataColumns),
     s"""
@@ -1053,6 +1058,6 @@ object BucketIdMetaUtils {
     // The bucket file name prefix is following Hive, Presto and Trino conversion, then
     // Hive bucketed tables written by Plugin can be read by other SQL engines.
     val fileNamePrefix = (bucketId: Int) => f"$bucketId%05d_0_"
-    GpuWriterBucketSpec(bucketIdExpression, fileNamePrefix)
+    new GpuWriterBucketSpec(bucketIdExpression, fileNamePrefix)
   }
 }
diff --git a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/GpuOrcFileFormat.scala b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/GpuOrcFileFormat.scala
index 62e59a530dc..e98d9f1c072 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/GpuOrcFileFormat.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/GpuOrcFileFormat.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2020-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2020-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -28,7 +28,6 @@ import org.apache.orc.OrcConf
 import org.apache.orc.OrcConf._
 import org.apache.orc.mapred.OrcStruct
 
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.SparkSession
 import org.apache.spark.sql.catalyst.util.CaseInsensitiveMap
 import org.apache.spark.sql.execution.datasources.FileFormat
@@ -37,7 +36,11 @@ import org.apache.spark.sql.internal.SQLConf
 import org.apache.spark.sql.rapids.execution.TrampolineUtil
 import org.apache.spark.sql.types._
 
-object GpuOrcFileFormat extends Logging {
+object GpuOrcFileFormat {
+  // Logger name is this object's class name without its trailing `$`.
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+  private def logInfo(msg: => String): Unit = if (log.isInfoEnabled) log.info(msg)
+
   // The classname used when Spark is configured to use the Hive implementation for ORC.
   // Spark is not always compiled with Hive support so we cannot import from Spark jars directly.
   private val HIVE_IMPL_CLASS = "org.apache.spark.sql.hive.orc.OrcFileFormat"
@@ -162,7 +165,7 @@ object GpuOrcFileFormat extends Logging {
   }
 }
 
-class GpuOrcFileFormat extends ColumnarFileFormat with Logging {
+class GpuOrcFileFormat extends ColumnarFileFormat {
   /**
    * Prepares a write job and returns an `ColumnarOutputWriterFactory`.  Client side job
    * preparation can be put here.  For example, user defined output committer can be configured here
diff --git a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/GpuReadAvroFileFormat.scala b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/GpuReadAvroFileFormat.scala
index a3cc1e9dab6..70da695ef8b 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/GpuReadAvroFileFormat.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/GpuReadAvroFileFormat.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2022-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2022-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -53,7 +53,7 @@ class GpuReadAvroFileFormat extends AvroFileFormat with GpuReadFileFormatWithMet
     val broadcastedHadoopConf =
       sparkSession.sparkContext.broadcast(new SerializableConfiguration(hadoopConf))
 
-    val factory = GpuAvroPartitionReaderFactory(
+    val factory = new GpuAvroPartitionReaderFactory(
       sqlConf,
       new RapidsConf(sqlConf),
       broadcastedHadoopConf,
@@ -73,7 +73,7 @@ class GpuReadAvroFileFormat extends AvroFileFormat with GpuReadFileFormatWithMet
       pushedFilters: Array[Filter],
       fileScan: GpuFileSourceScanExec): PartitionReaderFactory = {
     val poolConfBuilder = ThreadPoolConfBuilder(fileScan.rapidsConf)
-    GpuAvroMultiFilePartitionReaderFactory(
+    new GpuAvroMultiFilePartitionReaderFactory(
       fileScan.relation.sparkSession.sessionState.conf,
       fileScan.rapidsConf,
       broadcastedConf,
diff --git a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/GpuScalaUDF.scala b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/GpuScalaUDF.scala
index 11a8d2e9409..62f46684980 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/GpuScalaUDF.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/GpuScalaUDF.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2021-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2021-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -49,7 +49,7 @@ object GpuScalaUDFMeta {
       GpuUserDefinedFunction.udfTypeSig,
       TypeSig.all,
       repeatingParamCheck =
-        Some(RepeatingParamCheck("param", GpuUserDefinedFunction.udfTypeSig, TypeSig.all))),
+        Some(new RepeatingParamCheck("param", GpuUserDefinedFunction.udfTypeSig, TypeSig.all))),
     (expr, conf, p, r) => new ExprMeta(expr, conf, p, r) {
       lazy val opRapidsFunc = GpuScalaUDF.getRapidsUDFInstance(expr.function)
 
diff --git a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/GpuShuffleEnv.scala b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/GpuShuffleEnv.scala
index ecc5a1bb7f5..f3359696d63 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/GpuShuffleEnv.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/GpuShuffleEnv.scala
@@ -22,9 +22,22 @@ import com.nvidia.spark.rapids._
 import com.nvidia.spark.rapids.shims.ShuffleManagerShimUtils
 
 import org.apache.spark.{SparkConf, SparkEnv}
-import org.apache.spark.internal.Logging
 
-class GpuShuffleEnv(rapidsConf: RapidsConf) extends Logging {
+class GpuShuffleEnv(rapidsConf: RapidsConf) {
+  private val log = org.slf4j.LoggerFactory.getLogger(classOf[GpuShuffleEnv])
+  // Logs at INFO on `log`; the by-name `msg` is evaluated only if INFO is enabled.
+  private def logInfo(msg: => String): Unit = {
+    if (log.isInfoEnabled) {
+      log.info(msg)
+    }
+  }
+  // Logs at WARN on `log`; the by-name `msg` is evaluated only if WARN is enabled.
+  private def logWarning(msg: => String): Unit = {
+    if (log.isWarnEnabled) {
+      log.warn(msg)
+    }
+  }
+
   private var shuffleCatalog: ShuffleBufferCatalog = _
   private var shuffleReceivedBufferCatalog: ShuffleReceivedBufferCatalog = _
   private var multithreadedCatalog: MultithreadedShuffleBufferCatalog = _
@@ -89,7 +102,7 @@ class GpuShuffleEnv(rapidsConf: RapidsConf) extends Logging {
   }
 }
 
-object GpuShuffleEnv extends Logging {
+object GpuShuffleEnv {
   def isUCXShuffleAndEarlyStart(conf: RapidsConf): Boolean = {
     conf.isUCXShuffleManagerMode &&
       conf.shuffleTransportEarlyStart
diff --git a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/GpuTaskMetrics.scala b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/GpuTaskMetrics.scala
index fe24d8f860b..763d408e9a2 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/GpuTaskMetrics.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/GpuTaskMetrics.scala
@@ -18,57 +18,18 @@ package org.apache.spark.sql.rapids
 
 import java.{lang => jl}
 import java.io.ObjectInputStream
-import java.util.Locale
 import java.util.concurrent.ConcurrentHashMap
-import java.util.concurrent.TimeUnit
 import java.util.concurrent.atomic.AtomicLong
 
 import ai.rapids.cudf.{NvtxColor, NvtxRange}
-import com.nvidia.spark.rapids.{NvtxId, NvtxRegistry, PerfIO}
+import com.nvidia.spark.rapids.{NvtxId, NvtxRegistry}
 import com.nvidia.spark.rapids.Arm.withResource
 import com.nvidia.spark.rapids.ScalableTaskCompletion.onTaskCompletion
 import com.nvidia.spark.rapids.jni.RmmSpark
 
 import org.apache.spark.{SparkContext, TaskContext}
-import org.apache.spark.internal.Logging
 import org.apache.spark.util.{AccumulatorV2, LongAccumulator, Utils}
 
-case class NanoTime(value: java.lang.Long) {
-  override def toString: String = {
-    val hours = TimeUnit.NANOSECONDS.toHours(value)
-    var remaining = value - TimeUnit.HOURS.toNanos(hours)
-    val minutes = TimeUnit.NANOSECONDS.toMinutes(remaining)
-    remaining = remaining - TimeUnit.MINUTES.toNanos(minutes)
-    val seconds = remaining.toDouble / TimeUnit.SECONDS.toNanos(1)
-    val locale = Locale.US
-    "%02d:%02d:%06.3f".formatLocal(locale, hours, minutes, seconds)
-  }
-}
-
-// Format example:
-//  10.74GB (11534336000 bytes)
-//  1.23MB (1289750 bytes)
-//  1020.10KB (1044585 bytes)
-case class SizeInBytes(value: jl.Long) {
-  override def toString: String = {
-    var unitVal = value
-    var remainVal = 0L
-    var unitIndex = 0
-    while (unitIndex < SizeInBytes.SizeUnitNames.length && unitVal >= 1024) {
-      val nextUnitVal = unitVal >> 10
-      remainVal = unitVal - (nextUnitVal << 10)
-      unitVal = nextUnitVal
-      unitIndex += 1
-    }
-    val finalVal = "%.2f".format(unitVal + (remainVal.toDouble / 1024))
-    s"$finalVal${SizeInBytes.SizeUnitNames(unitIndex)} ($value bytes)"
-  }
-}
-
-private object SizeInBytes {
-  private val SizeUnitNames: Array[String] = Array("B", "KB", "MB", "GB", "TB", "PB", "EB")
-}
-
 class NanoSecondAccumulator extends AccumulatorV2[jl.Long, NanoTime] {
   private var _sum = 0L
   override def isZero: Boolean = _sum == 0
@@ -100,7 +61,7 @@ class NanoSecondAccumulator extends AccumulatorV2[jl.Long, NanoTime] {
         s"Cannot merge ${this.getClass.getName} with ${other.getClass.getName}")
   }
 
-  override def value: NanoTime = NanoTime(_sum)
+  override def value: NanoTime = new NanoTime(_sum)
 }
 
 /**
@@ -133,7 +94,7 @@ class SizeInBytesAccumulator extends AccumulatorV2[jl.Long, SizeInBytes] {
         s"Cannot merge ${this.getClass.getName} with ${other.getClass.getName}")
   }
 
-  override def value: SizeInBytes = SizeInBytes(_sum)
+  override def value: SizeInBytes = new SizeInBytes(_sum)
 
   private[spark] def setValue(newValue: Long): Unit = _sum = newValue
 }
@@ -164,7 +125,7 @@ class HighWatermarkAccumulator extends AccumulatorV2[jl.Long, SizeInBytes] {
         s"Cannot merge ${this.getClass.getName} with ${other.getClass.getName}")
   }
 
-  override def value: SizeInBytes = SizeInBytes(_value)
+  override def value: SizeInBytes = new SizeInBytes(_value)
 }
 
 class MaxLongAccumulator extends AccumulatorV2[jl.Long, jl.Long] {
@@ -242,7 +203,7 @@ class AvgLongAccumulator extends AccumulatorV2[jl.Long, jl.Double] {
   } else 0;
 }
 
-class GpuTaskMetrics extends Serializable with Logging {
+class GpuTaskMetrics extends Serializable {
   private val semaphoreHoldingTime = new NanoSecondAccumulator
   private val semWaitTimeNs = new NanoSecondAccumulator
   private val retryCount = new LongAccumulator
@@ -465,7 +426,8 @@ class GpuTaskMetrics extends Serializable with Logging {
       // allocations lives in the JNI. Therefore, we can stick the convention here of calling the
       // add method instead of adding a dedicated max method to the accumulator.
       if (maxDeviceMemoryBytes.value.value > 0) {
-        logError(s"updateMaxMemory called twice for task $taskAttemptId with maxMem $maxMem")
+        GpuTaskMetrics.log.error(s"updateMaxMemory called twice for task $taskAttemptId " +
+          s"with maxMem $maxMem")
       }
       maxDeviceMemoryBytes.add(maxMem)
     }
@@ -513,13 +475,13 @@ class GpuTaskMetrics extends Serializable with Logging {
    * to prevent double-counting — each new stage creates fresh accumulators with new IDs.
    */
   def recordPerfioS3BackendOnce(): Unit = {
-    val acc = PerfIO.s3BackendName match {
+    val acc = GpuTaskMetrics.perfIOS3BackendName match {
       case "netty" => perfioS3NettyExecutors
       case "crt"   => perfioS3CrtExecutors
       case _       => perfioS3S3aExecutors
     }
     try {
-      if (PerfIO.reportedBackendAccIds.add(acc.id)) {
+      if (GpuTaskMetrics.perfIOReportedBackendAccIds.add(acc.id)) {
         acc.add(1L)
       }
     } catch {
@@ -531,7 +493,26 @@ class GpuTaskMetrics extends Serializable with Logging {
 /**
  * Provides task level metrics
  */
-object GpuTaskMetrics extends Logging {
+object GpuTaskMetrics {
+  // PerfIO singleton obtained reflectively: load class `PerfIO$`, read static field `MODULE$`.
+  @transient private[this] lazy val perfIOModule = {
+    Class.forName("com.nvidia.spark.rapids.PerfIO" + "$")
+      .getField("MODULE" + "$")
+      .get(null)
+  }
+  // java.lang.reflect.Method handles for the two PerfIO accessors, resolved on first use.
+  @transient private[this] lazy val perfIOS3BackendNameMethod =
+    perfIOModule.getClass.getMethod("s3BackendName")
+  @transient private[this] lazy val perfIOReportedBackendAccIdsMethod =
+    perfIOModule.getClass.getMethod("reportedBackendAccIds")
+  // Reflective calls to PerfIO.s3BackendName / reportedBackendAccIds (cast types unverified).
+  private def perfIOS3BackendName: String =
+    perfIOS3BackendNameMethod.invoke(perfIOModule).asInstanceOf[String]
+  private def perfIOReportedBackendAccIds: java.util.Set[java.lang.Long] =
+    perfIOReportedBackendAccIdsMethod.invoke(perfIOModule)
+      .asInstanceOf[java.util.Set[java.lang.Long]]
+
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
   private val taskLevelMetrics = new ConcurrentHashMap[Long, GpuTaskMetrics]()
 
   private val hostBytesAllocated = new AtomicLong(0)
diff --git a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/RapidsShuffleInternalManagerBase.scala b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/RapidsShuffleInternalManagerBase.scala
index 69eff4ca387..96a0beba1a7 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/RapidsShuffleInternalManagerBase.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/RapidsShuffleInternalManagerBase.scala
@@ -37,7 +37,7 @@ import com.nvidia.spark.rapids.spill.SpillablePartialFileHandle
 
 import org.apache.spark.{InterruptibleIterator, MapOutputTracker, ShuffleDependency, SparkConf, SparkEnv, TaskContext}
 import org.apache.spark.executor.ShuffleWriteMetrics
-import org.apache.spark.internal.{config, Logging}
+import org.apache.spark.internal.config
 import org.apache.spark.io.CompressionCodec
 import org.apache.spark.network.buffer.ManagedBuffer
 import org.apache.spark.serializer.SerializerManager
@@ -71,7 +71,7 @@ class ShuffleHandleWithMetrics[K, V, C](
 abstract class GpuShuffleBlockResolverBase(
     val wrapped: IndexShuffleBlockResolver,
     catalog: ShuffleBufferCatalog)
-  extends ShuffleBlockResolver with Logging {
+  extends ShuffleBlockResolver with RapidsLocalLog {
   override def getBlockData(blockId: BlockId, dirs: Option[Array[String]]): ManagedBuffer = {
     // Get MultithreadedShuffleBufferCatalog dynamically since it may not be
     // initialized when the resolver is created
@@ -147,7 +147,7 @@ class ThreadSafeShuffleWriteMetricsReporter(val wrapped: ShuffleWriteMetricsRepo
   }
 }
 
-object RapidsShuffleInternalManagerBase extends Logging {
+object RapidsShuffleInternalManagerBase extends RapidsLocalLog {
   def unwrapHandle(handle: ShuffleHandle): ShuffleHandle = handle match {
     case gh: GpuShuffleHandle[_, _] => gh.wrapped
     case other => other
@@ -322,11 +322,11 @@ abstract class RapidsShuffleThreadedWriterBase[K, V](
 
   private var shuffleWriteRange: NvtxId = NvtxRegistry.THREADED_WRITER_WRITE.push()
 
-  // Case class for tracking partial sorted files in multi-batch scenario
-  private case class PartialFile(
-      handle: SpillablePartialFileHandle,
-      partitionLengths: Array[Long],
-      mapOutputWriter: ShuffleMapOutputWriter)
+  // Plain holder class (not a case class) for one partial sorted file in multi-batch scenario
+  private class PartialFile(
+      val handle: SpillablePartialFileHandle,
+      val partitionLengths: Array[Long],
+      val mapOutputWriter: ShuffleMapOutputWriter)
 
   /**
    * Represents a single compressed record ready to be written to disk.
@@ -337,10 +337,10 @@ abstract class RapidsShuffleThreadedWriterBase[K, V](
    * @param compressedSize The actual size of compressed data in buffer
    * @param remainingQuota The quota to release after writing to disk
    */
-  private case class CompressedRecord(
-    buffer: OpenByteArrayOutputStream,
-    compressedSize: Long,
-    remainingQuota: Long)
+  private class CompressedRecord(
+    val buffer: OpenByteArrayOutputStream,
+    val compressedSize: Long,
+    val remainingQuota: Long)
 
   /**
    * Encapsulates all state for processing one GPU batch in the multi-batch shuffle write.
@@ -370,19 +370,19 @@ abstract class RapidsShuffleThreadedWriterBase[K, V](
    * @param mergerSlotNum The merger thread pool slot assigned to this batch.
    * @param mergerFuture Future representing the merger task, used to wait for completion.
    */
-  private case class BatchState(
-    batchId: Int,
-    mapOutputWriter: ShuffleMapOutputWriter,
-    partitionRecords: ConcurrentHashMap[Int,
+  private class BatchState(
+    val batchId: Int,
+    val mapOutputWriter: ShuffleMapOutputWriter,
+    val partitionRecords: ConcurrentHashMap[Int,
       ConcurrentLinkedQueue[Future[CompressedRecord]]],
-    maxPartitionIdQueued: AtomicInteger,
-    mergerCondition: Object,
+    val maxPartitionIdQueued: AtomicInteger,
+    val mergerCondition: Object,
     // Flag for classic wait/notify pattern: set to true when new work is available,
     // reset to false after merger thread wakes up and checks actual data state.
     // This avoids busy-loop polling and provides clear signal for debugging.
-    hasNewWork: AtomicBoolean,
-    mergerSlotNum: Int,
-    mergerFuture: Future[_])
+    val hasNewWork: AtomicBoolean,
+    val mergerSlotNum: Int,
+    val mergerFuture: Future[_])
 
   /**
    * Increment the reference count and get the memory size for a value.
@@ -568,7 +568,7 @@ abstract class RapidsShuffleThreadedWriterBase[K, V](
         null
       })
 
-    BatchState(
+    new BatchState(
       batchId,
       writer,
       partitionRecords,
@@ -763,7 +763,7 @@ abstract class RapidsShuffleThreadedWriterBase[K, V](
               // Return CompressedRecord with buffer and remaining quota for Merger
               // Total released = excessQuota + remainingQuota should equal recordSize
               val remainingQuota = recordSize - excessQuota
-              CompressedRecord(buffer, compressedSize, remainingQuota)
+              new CompressedRecord(buffer, compressedSize, remainingQuota)
             }
           } catch {
             case e: Exception =>
@@ -823,7 +823,7 @@ abstract class RapidsShuffleThreadedWriterBase[K, V](
           // For multi-batch or when using catalog mode, extract handle
           val (handle, partLengths) = extractHandleAndLengthsFromWriter(
             batch.mapOutputWriter)
-          partialFiles += PartialFile(handle, partLengths, batch.mapOutputWriter)
+          partialFiles += new PartialFile(handle, partLengths, batch.mapOutputWriter)
         } else {
           // Single batch without catalog: commit normally
           commitAllPartitions(batch.mapOutputWriter, true)
@@ -1121,7 +1121,7 @@ abstract class RapidsShuffleThreadedReaderBase[K, C](
     mapOutputTracker: MapOutputTracker = SparkEnv.get.mapOutputTracker,
     canUseBatchFetch: Boolean = false,
     numReaderThreads: Int = 0)
-  extends ShuffleReader[K, C] with Logging {
+  extends ShuffleReader[K, C] with RapidsLocalLog {
 
   case class GetMapSizesResult(
       blocksByAddress: Iterator[(BlockManagerId, collection.Seq[(BlockId, Long, Int)])],
@@ -1712,8 +1712,8 @@ class RapidsCachingWriter[K, V](
  *       Apache Spark to use the RAPIDS shuffle manager,
  */
 class RapidsShuffleInternalManagerBase(conf: SparkConf, val isDriver: Boolean)
-  extends ShuffleManager with RapidsShuffleHeartbeatHandler with Logging
-  with RapidsShuffleReaderShim with ProxyShuffleReaderDelegate {
+  extends ShuffleManager with RapidsShuffleHeartbeatHandler
+  with RapidsLocalLog with RapidsShuffleReaderShim with ProxyShuffleReaderDelegate {
 
   def getServerId: BlockManagerId = server.fold(blockManager.blockManagerId)(_.getId)
 
diff --git a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/ShuffleCleanupListener.scala b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/ShuffleCleanupListener.scala
index 6fdae81c68a..f91cfbf4829 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/ShuffleCleanupListener.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/ShuffleCleanupListener.scala
@@ -23,7 +23,6 @@ import scala.collection.mutable
 
 import com.nvidia.spark.rapids.ShuffleCleanupManager
 
-import org.apache.spark.internal.Logging
 import org.apache.spark.scheduler.{SparkListener, SparkListenerEvent, SparkListenerJobStart}
 import org.apache.spark.sql.execution.SQLExecution
 import org.apache.spark.sql.execution.ui.SparkListenerSQLExecutionEnd
@@ -48,7 +47,22 @@ import org.apache.spark.sql.execution.ui.SparkListenerSQLExecutionEnd
  * Note: This file is placed in org.apache.spark.sql.rapids package to access
  * the private[spark] shuffleDepId field in StageInfo.
  */
-class ShuffleCleanupListener extends SparkListener with Logging {
+class ShuffleCleanupListener extends SparkListener {
+
+  private val log = org.slf4j.LoggerFactory.getLogger(classOf[ShuffleCleanupListener])
+  // Logs at INFO on `log`; the by-name `msg` is evaluated only if INFO is enabled.
+  private def logInfo(msg: => String): Unit = {
+    if (log.isInfoEnabled) {
+      log.info(msg)
+    }
+  }
+
+  // Logs at DEBUG on `log`; the by-name `msg` is evaluated only if DEBUG is enabled.
+  private def logDebug(msg: => String): Unit = {
+    if (log.isDebugEnabled) {
+      log.debug(msg)
+    }
+  }
 
   /**
    * Maps SQL execution ID to the set of shuffle IDs associated with that execution.
diff --git a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/aggregate/aggregateFunctions.scala b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/aggregate/aggregateFunctions.scala
index 2b9c5ea2b5e..dc71c038f95 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/aggregate/aggregateFunctions.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/aggregate/aggregateFunctions.scala
@@ -338,7 +338,7 @@ abstract class GpuMin(child: Expression) extends GpuAggregateFunction
 
   override def groupByScanAggregation(
       isRunningBatched: Boolean): Seq[AggAndReplace[GroupByScanAggregation]] =
-    Seq(AggAndReplace(GroupByScanAggregation.min(), Some(ReplacePolicy.PRECEDING)))
+    Seq(new AggAndReplace(GroupByScanAggregation.min(), Some(ReplacePolicy.PRECEDING)))
 
   override def isGroupByScanSupported: Boolean = child.dataType match {
     case StringType | TimestampType | DateType => false
@@ -347,7 +347,7 @@ abstract class GpuMin(child: Expression) extends GpuAggregateFunction
 
   override def scanInputProjection(isRunningBatched: Boolean): Seq[Expression] = inputProjection
   override def scanAggregation(isRunningBatched: Boolean): Seq[AggAndReplace[ScanAggregation]] =
-    Seq(AggAndReplace(ScanAggregation.min(), Some(ReplacePolicy.PRECEDING)))
+    Seq(new AggAndReplace(ScanAggregation.min(), Some(ReplacePolicy.PRECEDING)))
 
   override def isScanSupported: Boolean  = child.dataType match {
     case TimestampType | DateType => false
@@ -522,7 +522,7 @@ abstract class GpuMax(child: Expression) extends GpuAggregateFunction
 
   override def groupByScanAggregation(
       isRunningBatched: Boolean): Seq[AggAndReplace[GroupByScanAggregation]] =
-    Seq(AggAndReplace(GroupByScanAggregation.max(), Some(ReplacePolicy.PRECEDING)))
+    Seq(new AggAndReplace(GroupByScanAggregation.max(), Some(ReplacePolicy.PRECEDING)))
 
   override def isGroupByScanSupported: Boolean = child.dataType match {
     case StringType | TimestampType | DateType => false
@@ -531,7 +531,7 @@ abstract class GpuMax(child: Expression) extends GpuAggregateFunction
 
   override def scanInputProjection(isRunningBatched: Boolean): Seq[Expression] = inputProjection
   override def scanAggregation(isRunningBatched: Boolean): Seq[AggAndReplace[ScanAggregation]] =
-    Seq(AggAndReplace(ScanAggregation.max(), Some(ReplacePolicy.PRECEDING)))
+    Seq(new AggAndReplace(ScanAggregation.max(), Some(ReplacePolicy.PRECEDING)))
 
   override def isScanSupported: Boolean = child.dataType match {
     case TimestampType | DateType => false
@@ -1044,13 +1044,13 @@ abstract class GpuSum(
 
   override def groupByScanAggregation(
       isRunningBatched: Boolean): Seq[AggAndReplace[GroupByScanAggregation]] =
-    Seq(AggAndReplace(GroupByScanAggregation.sum(), Some(ReplacePolicy.PRECEDING)))
+    Seq(new AggAndReplace(GroupByScanAggregation.sum(), Some(ReplacePolicy.PRECEDING)))
 
   override def scanInputProjection(isRunningBatched: Boolean): Seq[Expression] =
     windowInputProjection
 
   override def scanAggregation(isRunningBatched: Boolean): Seq[AggAndReplace[ScanAggregation]] =
-    Seq(AggAndReplace(ScanAggregation.sum(), Some(ReplacePolicy.PRECEDING)))
+    Seq(new AggAndReplace(ScanAggregation.sum(), Some(ReplacePolicy.PRECEDING)))
 
   override def scanCombine(isRunningBatched: Boolean, cols: Seq[ColumnVector]): ColumnVector = {
     if (internalSumForWindowDataType != resultType) {
@@ -1498,13 +1498,13 @@ case class GpuCount(children: Seq[Expression],
 
   override def groupByScanAggregation(
       isRunningBatched: Boolean): Seq[AggAndReplace[GroupByScanAggregation]] =
-    Seq(AggAndReplace(GroupByScanAggregation.sum(), None))
+    Seq(new AggAndReplace(GroupByScanAggregation.sum(), None))
 
   override def scanInputProjection(isRunningBatched: Boolean): Seq[Expression] =
     groupByScanInputProjection(isRunningBatched)
 
   override def scanAggregation(isRunningBatched: Boolean): Seq[AggAndReplace[ScanAggregation]] =
-    Seq(AggAndReplace(ScanAggregation.sum(), None))
+    Seq(new AggAndReplace(ScanAggregation.sum(), None))
 
   override def scanCombine(isRunningBatched: Boolean, cols: Seq[ColumnVector]): ColumnVector =
     cols.head.castTo(DType.INT64)
diff --git a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/catalyst/expressions/GpuEquivalentExpressions.scala b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/catalyst/expressions/GpuEquivalentExpressions.scala
index 916bb2335da..314b2747176 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/catalyst/expressions/GpuEquivalentExpressions.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/catalyst/expressions/GpuEquivalentExpressions.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2022-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2022-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -50,7 +50,7 @@ class GpuEquivalentExpressions {
   private def addExprToMap(
       expr: Expression, map: mutable.HashMap[GpuExpressionEquals, GpuExpressionStats]): Boolean = {
     if (expr.deterministic) {
-      val wrapper = GpuExpressionEquals(expr)
+      val wrapper = new GpuExpressionEquals(expr)
       map.get(wrapper) match {
         case Some(stats) =>
           stats.useCount += 1
@@ -242,7 +242,7 @@ class GpuEquivalentExpressions {
    * Exposed for testing.
    */
   private[sql] def getExprState(e: Expression): Option[GpuExpressionStats] = {
-    equivalenceMap.get(GpuExpressionEquals(e))
+    equivalenceMap.get(new GpuExpressionEquals(e))
   }
 
   // Exposed for testing.
@@ -281,7 +281,7 @@ object GpuEquivalentExpressions {
     expr match {
       case e: AttributeReference => e
       case _ =>
-        substitutionMap.get(GpuExpressionEquals(expr)) match {
+        substitutionMap.get(new GpuExpressionEquals(expr)) match {
           case Some(attr) => attr
           case None => expr.mapChildren(replaceWithSemanticCommonRef(_, substitutionMap))
         }
@@ -510,7 +510,7 @@ trait GpuCombinable extends GpuExpression {
 /**
  * Wrapper around an Expression that provides semantic equality.
  */
-case class GpuExpressionEquals(e: Expression) {
+class GpuExpressionEquals(val e: Expression) {
   override def equals(o: Any): Boolean = o match {
     case other: GpuExpressionEquals => e.semanticEquals(other.e)
     case _ => false
diff --git a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/catalyst/expressions/GpuRandomExpressions.scala b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/catalyst/expressions/GpuRandomExpressions.scala
index 3f3ae2cf11e..b51fef4f83a 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/catalyst/expressions/GpuRandomExpressions.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/catalyst/expressions/GpuRandomExpressions.scala
@@ -100,7 +100,7 @@ case class GpuRand(child: Expression, doContextCheck: Boolean) extends ShimUnary
   private lazy val seed: Long = child match {
     case GpuLiteral(s, IntegerType) => s.asInstanceOf[Int]
     case GpuLiteral(s, LongType) => s.asInstanceOf[Long]
-    case _ => throw new RapidsAnalysisException(
+    case _ => throw RapidsAnalysisException(
       s"Input argument to $prettyName must be an integer, long or null literal.")
   }
 
diff --git a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/collectionOperations.scala b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/collectionOperations.scala
index b0a6602f0ef..ac1a582de43 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/collectionOperations.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/collectionOperations.scala
@@ -29,6 +29,7 @@ import com.nvidia.spark.rapids.RapidsPluginImplicits._
 import com.nvidia.spark.rapids.jni.{GpuListSliceUtils, MapUtils}
 import com.nvidia.spark.rapids.shims.{GetSequenceSize, NullIntolerantShim, ShimExpression}
 
+import org.apache.spark.internal.config.ConfigEntry
 import org.apache.spark.sql.catalyst.analysis.{TypeCheckResult, TypeCoercion}
 import org.apache.spark.sql.catalyst.expressions.{ElementAt, ExpectsInputTypes, Expression, ImplicitCastInputTypes, NamedExpression, RowOrdering, Sequence, TimeZoneAwareExpression}
 import org.apache.spark.sql.catalyst.trees.{CurrentOrigin, Origin}
@@ -39,6 +40,14 @@ import org.apache.spark.sql.types._
 import org.apache.spark.sql.vectorized.ColumnarBatch
 import org.apache.spark.unsafe.array.ByteArrayMethods.MAX_ROUNDED_ARRAY_LENGTH
 
+// Spark 4.1+ returns an enum value instead of String for this conf, so go through toString.
+object GpuMapDedupPolicy {
+  private val confEntry = SQLConf.MAP_KEY_DEDUP_POLICY.asInstanceOf[ConfigEntry[AnyRef]]
+  def current: String = SQLConf.get.getConf(confEntry).toString
+  // equalsIgnoreCase avoids the default-locale dependence of String.toUpperCase.
+  def isException: Boolean = current.equalsIgnoreCase("EXCEPTION")
+}
+
 case class GpuConcat(children: Seq[Expression]) extends GpuComplexTypeMergingExpression {
 
   @transient override lazy val dataType: DataType = {
@@ -522,9 +531,10 @@ case class GpuElementAt(left: Expression, right: Expression, failOnError: Boolea
               }
               withResource(hasLargerIndices) { _ =>
                 if (BoolUtils.isAnyValidTrue(hasLargerIndices)) {
-                  val (index, numElem) = firstIndexAndNumElementUnchecked(hasLargerIndices,
+                  val indexAndNumElement = firstIndexAndNumElementUnchecked(hasLargerIndices,
                     indices, numElements)
-                  throw RapidsErrorUtils.invalidArrayIndexError(index, numElem, true)
+                  throw RapidsErrorUtils.invalidArrayIndexError(
+                    indexAndNumElement.getIndex, indexAndNumElement.getNumElements, true)
                 }
               }
             }
@@ -739,7 +749,7 @@ case class GpuMapEntries(child: Expression) extends GpuUnaryExpression with Expe
 
 case class GpuMapFromEntries(child: Expression) extends GpuUnaryExpression with ExpectsInputTypes {
 
-  private val mapKeyDedupPolicy = SQLConf.get.getConf(SQLConf.MAP_KEY_DEDUP_POLICY)
+  private val mapKeyDedupPolicy = GpuMapDedupPolicy.current
 
   override def inputTypes: Seq[AbstractDataType] = Seq(ArrayType)
 
@@ -1533,7 +1543,7 @@ case class GpuArraysOverlap(left: Expression, right: Expression)
 
 case class GpuMapFromArrays(left: Expression, right: Expression) extends GpuBinaryExpression {
 
-  private val mapKeyDedupPolicy = SQLConf.get.getConf(SQLConf.MAP_KEY_DEDUP_POLICY)
+  private val mapKeyDedupPolicy = GpuMapDedupPolicy.current
 
   override def dataType: MapType = {
     MapType(
diff --git a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/complexTypeCreator.scala b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/complexTypeCreator.scala
index 4e21fa07ab1..e7f60b1eb8e 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/complexTypeCreator.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/complexTypeCreator.scala
@@ -151,9 +151,7 @@ object GpuCreateMap {
       SQLConf.get.getConf(SQLConf.LEGACY_CREATE_EMPTY_COLLECTION_USING_STRING_TYPE))
   }
 
-  // Spark 4.1+ returns an enum value instead of String, so use toString first
-  def exceptionOnDupKeys: Boolean =
-    SQLConf.get.getConf(SQLConf.MAP_KEY_DEDUP_POLICY).toString.toUpperCase == "EXCEPTION"
+  def exceptionOnDupKeys: Boolean = GpuMapDedupPolicy.isException
 
   def createMapFromKeysValuesAsStructs(dataType: MapType,
                                        listsOfKeyValueStructs : ColumnView): GpuColumnVector = {
diff --git a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/complexTypeExtractors.scala b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/complexTypeExtractors.scala
index 48e25a98367..676687d86e8 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/complexTypeExtractors.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/complexTypeExtractors.scala
@@ -36,7 +36,6 @@ import org.apache.spark.sql.vectorized.ColumnarBatch
 case class GpuGetStructField(child: Expression, ordinal: Int, name: Option[String] = None)
     extends ShimUnaryExpression
     with GpuExpression
-    with ShimGetStructField
     with NullIntolerantShim {
 
   lazy val childSchema: StructType = child.dataType.asInstanceOf[StructType]
@@ -123,9 +122,10 @@ case class GpuGetArrayItem(child: Expression, ordinal: Expression, failOnError:
                 hasNegativeIndicesCV, array)
             withResource(hasValidEntryCV) { _ =>
               if (isAnyValidTrue(hasValidEntryCV)) {
-                val (index, numElem) = firstIndexAndNumElementUnchecked(hasValidEntryCV,
+                val indexAndNumElement = firstIndexAndNumElementUnchecked(hasValidEntryCV,
                   indices, numElements)
-                throw RapidsErrorUtils.invalidArrayIndexError(index, numElem)
+                throw RapidsErrorUtils.invalidArrayIndexError(
+                  indexAndNumElement.getIndex, indexAndNumElement.getNumElements)
               }
             }
             // Then check if any index is larger than its array size
@@ -133,9 +133,10 @@ case class GpuGetArrayItem(child: Expression, ordinal: Expression, failOnError:
               // No need to check the validity of array column here, since the validity info
               // is included in this `hasLargerIndicesCV`.
               if (isAnyValidTrue(hasLargerIndicesCV)) {
-                val (index, numElem) = firstIndexAndNumElementUnchecked(hasLargerIndicesCV,
+                val indexAndNumElement = firstIndexAndNumElementUnchecked(hasLargerIndicesCV,
                   indices, numElements)
-                throw RapidsErrorUtils.invalidArrayIndexError(index, numElem)
+                throw RapidsErrorUtils.invalidArrayIndexError(
+                  indexAndNumElement.getIndex, indexAndNumElement.getNumElements)
               }
             }
           }
diff --git a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/GpuBroadcastExchangeExec.scala b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/GpuBroadcastExchangeExec.scala
index ee0988d7f90..9915c49a706 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/GpuBroadcastExchangeExec.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/GpuBroadcastExchangeExec.scala
@@ -37,7 +37,6 @@ import com.nvidia.spark.rapids.shims.{BroadcastExchangeShims, ShimBroadcastExcha
 
 import org.apache.spark.SparkException
 import org.apache.spark.broadcast.Broadcast
-import org.apache.spark.internal.Logging
 import org.apache.spark.launcher.SparkLauncher
 import org.apache.spark.rdd.RDD
 import org.apache.spark.sql.catalyst.InternalRow
@@ -75,7 +74,7 @@ class SerializeConcatHostBuffersDeserializeBatch(
     output: Seq[Attribute],
     var numRows: Int,
     var dataLen: Long)
-  extends Serializable with Logging {
+  extends Serializable {
   @transient private var dataTypes = output.map(_.dataType).toArray
 
   // used for memoization of deserialization to GPU on Executor
@@ -323,7 +322,7 @@ class GpuBroadcastMeta(
     conf: RapidsConf,
     parent: Option[RapidsMeta[_, _, _]],
     rule: DataFromReplacementRule) extends
-  SparkPlanMeta[BroadcastExchangeExec](exchange, conf, parent, rule) with Logging {
+  SparkPlanMeta[BroadcastExchangeExec](exchange, conf, parent, rule) {
 
   override def tagPlanForGpu(): Unit = {
     if (!TrampolineUtil.isSupportedRelation(exchange.mode)) {
@@ -643,7 +642,7 @@ case class GpuBroadcastExchangeExec(
 }
 
 /** Caches the mappings from canonical CPU exchanges to the GPU exchanges that replaced them */
-object ExchangeMappingCache extends Logging {
+object ExchangeMappingCache {
   // Cache is a mapping from CPU broadcast plan to GPU broadcast plan. The cache should not
   // artificially hold onto unused plans, so we make both the keys and values weak. The values
   // point to their corresponding keys, so the keys will not be collected unless the value
diff --git a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/GpuBroadcastToRowExec.scala b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/GpuBroadcastToRowExec.scala
index 2b2c11ada2a..2f6d51aba84 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/GpuBroadcastToRowExec.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/GpuBroadcastToRowExec.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2022-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2022-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -28,7 +28,6 @@ import com.nvidia.spark.rapids.shims.{ShimBroadcastExchangeLike, ShimUnaryExecNo
 
 import org.apache.spark.SparkException
 import org.apache.spark.broadcast.Broadcast
-import org.apache.spark.internal.Logging
 import org.apache.spark.rdd.RDD
 import org.apache.spark.sql.catalyst.InternalRow
 import org.apache.spark.sql.catalyst.expressions.{BoundReference, Expression, UnsafeProjection}
@@ -46,7 +45,7 @@ case class GpuBroadcastToRowExec(
   buildKeys: Seq[Expression],
   broadcastMode: BroadcastMode,
   child: SparkPlan)
-  extends ShimBroadcastExchangeLike with ShimUnaryExecNode with GpuExec with Logging {
+  extends ShimBroadcastExchangeLike with ShimUnaryExecNode with GpuExec {
 
   @transient
   private val timeout: Long = conf.broadcastTimeout
diff --git a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/GpuHashJoin.scala b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/GpuHashJoin.scala
index 78b6154f52b..5d4087852c4 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/GpuHashJoin.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/GpuHashJoin.scala
@@ -78,9 +78,9 @@ object JoinTypeChecks {
     joinRideAlongTypes,
     TypeSig.all,
     Map(
-      LEFT_KEYS -> InputCheck(cudfSupportedKeyTypes, sparkSupportedJoinKeyTypes),
-      RIGHT_KEYS -> InputCheck(cudfSupportedKeyTypes, sparkSupportedJoinKeyTypes),
-      CONDITION -> InputCheck(TypeSig.BOOLEAN, TypeSig.BOOLEAN)))
+      LEFT_KEYS -> new InputCheck(cudfSupportedKeyTypes, sparkSupportedJoinKeyTypes, List.empty),
+      RIGHT_KEYS -> new InputCheck(cudfSupportedKeyTypes, sparkSupportedJoinKeyTypes, List.empty),
+      CONDITION -> new InputCheck(TypeSig.BOOLEAN, TypeSig.BOOLEAN, List.empty)))
 
   def equiJoinMeta(leftKeys: Seq[BaseExprMeta[_]],
       rightKeys: Seq[BaseExprMeta[_]],
@@ -94,7 +94,7 @@ object JoinTypeChecks {
   val nonEquiJoinChecks: ExecChecks = ExecChecks(
     joinRideAlongTypes,
     TypeSig.all,
-    Map(CONDITION -> InputCheck(TypeSig.BOOLEAN, TypeSig.BOOLEAN,
+    Map(CONDITION -> new InputCheck(TypeSig.BOOLEAN, TypeSig.BOOLEAN,
       notes = List("A non-inner join only is supported if the condition expression can be " +
           "converted to a GPU AST expression"))))
 
@@ -1063,44 +1063,6 @@ object JoinBuildSideSelection extends Enumeration {
   }
 }
 
-/**
- * Options to control join behavior.
- * @param strategy the join strategy to use (AUTO, INNER_HASH_WITH_POST, INNER_SORT_WITH_POST,
- *                 or HASH_ONLY)
- * @param buildSideSelection the build side selection strategy (AUTO, FIXED, or SMALLEST)
- * @param targetSize the target batch size in bytes for the join operation
- * @param logCardinalityEnabled whether to log cardinality statistics for debugging
- * @param sizeEstimateThreshold the threshold used to decide when to skip the expensive join
- *                              output size estimation (defaults to 0.75)
- */
-case class JoinOptions(
-    strategy: JoinStrategy.JoinStrategy,
-    buildSideSelection: JoinBuildSideSelection.JoinBuildSideSelection,
-    targetSize: Long,
-    logCardinalityEnabled: Boolean,
-    sizeEstimateThreshold: Double)
-
-/**
- * Statistics for join cardinality logging to help diagnose performance issues.
- * @param leftRowCount number of rows on the left side
- * @param rightRowCount number of rows on the right side
- * @param leftDistinctCount distinct count of left join keys
- * @param rightDistinctCount distinct count of right join keys
- * @param leftNullCounts null counts for each left key column
- * @param rightNullCounts null counts for each right key column
- * @param leftKeyTypes data types of the left join keys
- * @param rightKeyTypes data types of the right join keys
- */
-case class JoinCardinalityStats(
-    leftRowCount: Long,
-    rightRowCount: Long,
-    leftDistinctCount: Long,
-    rightDistinctCount: Long,
-    leftNullCounts: Seq[Long],
-    rightNullCounts: Seq[Long],
-    leftKeyTypes: Seq[DataType],
-    rightKeyTypes: Seq[DataType])
-
 /**
  * Class to hold statistics on the build-side batch of a hash join.
  * @param streamMagnificationFactor estimated magnification of a stream batch during join
@@ -1188,6 +1150,19 @@ abstract class BaseHashJoinIterator(
-   * Compute cardinality statistics for both sides of the join.
-   * This is used for diagnostic logging when logJoinCardinality is enabled.
+   * The join strategy held by `joinOptions`, cast to `JoinStrategy.JoinStrategy`.
    */
+  protected def joinStrategy: JoinStrategy.JoinStrategy =
+    joinOptions.strategy.asInstanceOf[JoinStrategy.JoinStrategy]
+
+  /**
+   * The build side selection held by `joinOptions`, cast to
+   * `JoinBuildSideSelection.JoinBuildSideSelection`.
+   */
+  protected def buildSideSelection: JoinBuildSideSelection.JoinBuildSideSelection =
+    joinOptions.buildSideSelection.asInstanceOf[JoinBuildSideSelection.JoinBuildSideSelection]
+
+  /**
+   * Compute cardinality statistics for both sides of the join.
+   * This is used for diagnostic logging when logJoinCardinality is enabled.
+   */
   protected def computeCardinalityStats(
       leftKeys: Table,
       rightKeys: Table): JoinCardinalityStats = {
@@ -1207,7 +1175,7 @@ abstract class BaseHashJoinIterator(
     val leftKeyTypes = boundBuiltKeys.map(_.dataType)
     val rightKeyTypes = boundStreamKeys.map(_.dataType)
     
-    JoinCardinalityStats(
+    new JoinCardinalityStats(
       leftRowCount,
       rightRowCount,
       leftDistinctCount,
@@ -1550,10 +1518,10 @@ class HashJoinIterator(
       rightData: LazySpillableColumnarBatch): GatherMapsResult = {
     // Apply heuristics to select the effective strategy
     val effectiveStrategy = JoinStrategy.selectStrategy(
-      joinOptions.strategy,
+      joinStrategy,
       joinType,
       hasCondition = false,  // This is called for unconditional joins
-      joinOptions.buildSideSelection,
+      buildSideSelection,
       leftKeys.getRowCount,
       rightKeys.getRowCount)
 
@@ -1594,7 +1562,7 @@ class HashJoinIterator(
     logJoinCardinality(leftKeys, rightKeys, implName)
 
     val innerMaps = JoinImpl.innerHashJoin(leftKeys, rightKeys, compareNullsEqual,
-      joinOptions.buildSideSelection, buildSide)
+      buildSideSelection, buildSide)
 
     val leftRowCount = leftKeys.getRowCount
     val rightRowCount = rightKeys.getRowCount
@@ -1610,7 +1578,7 @@ class HashJoinIterator(
     logJoinCardinality(leftKeys, rightKeys, "INNER_SORT_WITH_POST")
     
     val innerMaps = JoinImpl.innerSortJoin(leftKeys, rightKeys, compareNullsEqual,
-      joinOptions.buildSideSelection, buildSide)
+      buildSideSelection, buildSide)
 
     val leftRowCount = leftKeys.getRowCount
     val rightRowCount = rightKeys.getRowCount
@@ -1632,7 +1600,7 @@ class HashJoinIterator(
         JoinImpl.rightOuterHashJoinBuildLeft(leftKeys, rightKeys, compareNullsEqual)
       case _: InnerLike =>
         JoinImpl.innerHashJoin(leftKeys, rightKeys, compareNullsEqual,
-          joinOptions.buildSideSelection, buildSide)
+          buildSideSelection, buildSide)
       case LeftSemi =>
         JoinImpl.leftSemiHashJoinBuildRight(leftKeys, rightKeys, compareNullsEqual)
       case LeftAnti =>
@@ -1696,10 +1664,10 @@ class ConditionalHashJoinIterator(
         withResource(GpuColumnVector.from(rightData.getBatch)) { rightTable =>
           // Apply heuristics to select the effective strategy for conditional joins
           val effectiveStrategy = JoinStrategy.selectStrategy(
-            joinOptions.strategy,
+            joinStrategy,
             joinType,
             hasCondition = true,  // This is a conditional join
-            joinOptions.buildSideSelection,
+            buildSideSelection,
             leftKeys.getRowCount,
             rightKeys.getRowCount)
 
@@ -1750,7 +1718,7 @@ class ConditionalHashJoinIterator(
     val rightRowCount = rightKeys.getRowCount
 
     val innerMaps = JoinImpl.innerHashJoin(leftKeys, rightKeys,
-      nullEquality == NullEquality.EQUAL, joinOptions.buildSideSelection, buildSide)
+      nullEquality == NullEquality.EQUAL, buildSideSelection, buildSide)
 
     val compiledCondition = lazyCompiledCondition.getForBuildSide(buildSide)
 
@@ -1777,7 +1745,7 @@ class ConditionalHashJoinIterator(
     val rightRowCount = rightKeys.getRowCount
 
     val innerMaps = JoinImpl.innerSortJoin(leftKeys, rightKeys,
-      nullEquality == NullEquality.EQUAL, joinOptions.buildSideSelection, buildSide)
+      nullEquality == NullEquality.EQUAL, buildSideSelection, buildSide)
 
     val compiledCondition = lazyCompiledCondition.getForBuildSide(buildSide)
 
@@ -1804,7 +1772,7 @@ class ConditionalHashJoinIterator(
       case _: InnerLike =>
         // For inner joins, use dynamic build side selection
         val selectedBuildSide = JoinBuildSideSelection.selectPhysicalBuildSide(
-          joinOptions.buildSideSelection, buildSide,
+          buildSideSelection, buildSide,
           leftKeys.getRowCount, rightKeys.getRowCount)
         selectedBuildSide match {
           case GpuBuildLeft =>
@@ -1933,10 +1901,10 @@ class HashJoinStreamSideIterator(
     // Apply heuristics to select the effective strategy for unconditional joins
     // Note: subJoinType is used for strategy selection since that's what we're actually executing
     val effectiveStrategy = JoinStrategy.selectStrategy(
-      joinOptions.strategy,
+      joinStrategy,
       subJoinType,
       hasCondition = false,
-      joinOptions.buildSideSelection,
+      buildSideSelection,
       leftKeys.getRowCount,
       rightKeys.getRowCount)
     
@@ -1977,7 +1945,7 @@ class HashJoinStreamSideIterator(
     logJoinCardinality(leftKeys, rightKeys, implName, originalJoinType)
 
     val innerMaps = JoinImpl.innerHashJoin(leftKeys, rightKeys, compareNullsEqual,
-      joinOptions.buildSideSelection, cudfBuildSide)
+      buildSideSelection, cudfBuildSide)
 
     val leftRowCount = leftKeys.getRowCount
     val rightRowCount = rightKeys.getRowCount
@@ -1996,7 +1964,7 @@ class HashJoinStreamSideIterator(
       originalJoinType)
 
     val innerMaps = JoinImpl.innerSortJoin(leftKeys, rightKeys, compareNullsEqual,
-      joinOptions.buildSideSelection, cudfBuildSide)
+      buildSideSelection, cudfBuildSide)
 
     val leftRowCount = leftKeys.getRowCount
     val rightRowCount = rightKeys.getRowCount
@@ -2020,7 +1988,7 @@ class HashJoinStreamSideIterator(
         JoinImpl.rightOuterHashJoinBuildLeft(leftKeys, rightKeys, compareNullsEqual)
       case Inner =>
         JoinImpl.innerHashJoin(leftKeys, rightKeys, compareNullsEqual,
-          joinOptions.buildSideSelection, cudfBuildSide)
+          buildSideSelection, cudfBuildSide)
       case t =>
         throw new IllegalStateException(s"unsupported join type: $t")
     }
@@ -2041,10 +2009,10 @@ class HashJoinStreamSideIterator(
       withResource(GpuColumnVector.from(rightData.getBatch)) { rightTable =>
         // Apply heuristics to select the effective strategy for conditional joins
         val effectiveStrategy = JoinStrategy.selectStrategy(
-          joinOptions.strategy,
+          joinStrategy,
           subJoinType,
           hasCondition = true,
-          joinOptions.buildSideSelection,
+          buildSideSelection,
           leftKeys.getRowCount,
           rightKeys.getRowCount)
 
@@ -2093,7 +2061,7 @@ class HashJoinStreamSideIterator(
     logJoinCardinality(leftKeys, rightKeys, implName, originalJoinType)
 
     val innerMaps = JoinImpl.innerHashJoin(leftKeys, rightKeys, compareNullsEqual,
-      joinOptions.buildSideSelection, cudfBuildSide)
+      buildSideSelection, cudfBuildSide)
 
     val compiledCondition = lazyCondition.getForBuildSide(cudfBuildSide)
 
@@ -2122,7 +2090,7 @@ class HashJoinStreamSideIterator(
       originalJoinType)
 
     val innerMaps = JoinImpl.innerSortJoin(leftKeys, rightKeys, compareNullsEqual,
-      joinOptions.buildSideSelection, cudfBuildSide)
+      buildSideSelection, cudfBuildSide)
 
     val compiledCondition = lazyCondition.getForBuildSide(cudfBuildSide)
 
@@ -2161,7 +2129,7 @@ class HashJoinStreamSideIterator(
         // For inner sub-joins, use dynamic build side selection
         // For sub-joins, the plan build side is cudfBuildSide (GpuBuildRight for Inner)
         val selectedBuildSide = JoinBuildSideSelection.selectPhysicalBuildSide(
-          joinOptions.buildSideSelection, cudfBuildSide,
+          buildSideSelection, cudfBuildSide,
           leftKeys.getRowCount, rightKeys.getRowCount)
         selectedBuildSide match {
           case GpuBuildLeft =>
diff --git a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/GpuShuffleExchangeExecBase.scala b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/GpuShuffleExchangeExecBase.scala
index bd7c4147827..3726566c866 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/GpuShuffleExchangeExecBase.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/GpuShuffleExchangeExecBase.scala
@@ -419,7 +419,11 @@ object GpuShuffleExchangeExecBase {
       }.toArray.toSeq
       val sorter = new GpuSorter(boundReferences, outputAttributes, metrics)
       rdd.mapPartitions { cbIter =>
-        GpuSortEachBatchIterator(cbIter, sorter, false)
+        new GpuSortEachBatchIterator(cbIter, sorter, false,
+          opTime = NoopMetric,
+          sortTime = NoopMetric,
+          outputBatches = NoopMetric,
+          outputRows = NoopMetric)
       }
     } else {
       rdd
diff --git a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/GpuSubPartitionHashJoin.scala b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/GpuSubPartitionHashJoin.scala
index 12faa151a4b..4eebeb813db 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/GpuSubPartitionHashJoin.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/GpuSubPartitionHashJoin.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2023-2025, NVIDIA CORPORATION. All rights reserved.
+ * Copyright (c) 2023-2026, NVIDIA CORPORATION. All rights reserved.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -18,12 +18,13 @@ package org.apache.spark.sql.rapids.execution
 import scala.collection.mutable
 import scala.collection.mutable.ArrayBuffer
 
-import com.nvidia.spark.rapids.{GpuBatchUtils, GpuColumnVector, GpuExpression, GpuHashPartitioner, GpuMetric, NvtxRegistry, RmmRapidsRetryIterator, SpillableColumnarBatch, SpillPriorities, TaskAutoCloseableResource}
+import com.nvidia.spark.rapids.{GpuBatchUtils, GpuColumnVector, GpuExpression, GpuHashPartitioner,
+  GpuMetric, NvtxRegistry, RapidsLocalLog, RmmRapidsRetryIterator, SpillableColumnarBatch,
+  SpillPriorities, TaskAutoCloseableResource}
 import com.nvidia.spark.rapids.Arm.{closeOnExcept, withResource}
 import com.nvidia.spark.rapids.RapidsPluginImplicits._
 
 import org.apache.spark.TaskContext
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.catalyst.plans.InnerLike
 import org.apache.spark.sql.rapids.{GpuHashExpression, GpuMurmur3Hash}
 import org.apache.spark.sql.rapids.shims.DataTypeUtilsShim
@@ -89,7 +90,7 @@ class GpuBatchSubPartitioner(
     numPartitions: Int,
     hashSeed: Int,
     name: String = "GpuBatchSubPartitioner") extends GpuHashPartitioner
-  with AutoCloseable with Logging {
+  with AutoCloseable with RapidsLocalLog {
 
   private var isNotInited = true
   private var numCurBatches = 0
@@ -228,7 +229,7 @@ class GpuBatchSubPartitioner(
 class GpuBatchSubPartitionIterator(
     batchSubPartitioner: GpuBatchSubPartitioner,
     targetBatchSize: Long)
-  extends Iterator[(Seq[Int], Seq[SpillableColumnarBatch])] with Logging {
+  extends Iterator[(Seq[Int], Seq[SpillableColumnarBatch])] with RapidsLocalLog {
 
   // The partitions to be read. Initially it is all the partitions.
   private val remainingPartIds: ArrayBuffer[Int] =
@@ -558,7 +559,7 @@ abstract class BaseSubHashJoinIterator(
   protected def setupJoinIterator(pair: PartitionPair): Option[Iterator[ColumnarBatch]]
 }
 
-trait GpuSubPartitionHashJoin extends Logging { self: GpuHashJoin =>
+trait GpuSubPartitionHashJoin { self: GpuHashJoin =>
 
   protected lazy val buildSchema: StructType = DataTypeUtilsShim.fromAttributes(buildPlan.output)
 
diff --git a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/InternalColumnarRddConverter.scala b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/InternalColumnarRddConverter.scala
index 02eaafb5ed4..3707023e834 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/InternalColumnarRddConverter.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/InternalColumnarRddConverter.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2019-2025, NVIDIA CORPORATION. All rights reserved.
+ * Copyright (c) 2019-2026, NVIDIA CORPORATION. All rights reserved.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -21,7 +21,6 @@ import com.nvidia.spark.rapids._
 import com.nvidia.spark.rapids.GpuColumnVector.GpuColumnarBatchBuilder
 
 import org.apache.spark.TaskContext
-import org.apache.spark.internal.Logging
 import org.apache.spark.rdd.{MapPartitionsRDD, RDD}
 import org.apache.spark.sql.{DataFrame, Row}
 import org.apache.spark.sql.catalyst.InternalRow
@@ -102,22 +101,22 @@ private object GpuExternalRowToColumnConverter {
       // NOT SUPPORTED YET
       // case CalendarIntervalType => CalendarConverter
       case (at: ArrayType, true) =>
-        ArrayConverter(getConverterForType(at.elementType, at.containsNull))
+        new ArrayConverter(getConverterForType(at.elementType, at.containsNull))
       case (at: ArrayType, false) =>
-        NotNullArrayConverter(getConverterForType(at.elementType, at.containsNull))
+        new NotNullArrayConverter(getConverterForType(at.elementType, at.containsNull))
       case (st: StructType, true) =>
-        StructConverter(st.fields.map(getConverterFor))
+        new StructConverter(st.fields.map(getConverterFor))
       case (st: StructType, false) =>
-        NotNullStructConverter(st.fields.map(getConverterFor))
+        new NotNullStructConverter(st.fields.map(getConverterFor))
       case (dt: DecimalType, true) =>
         new DecimalConverter(dt.precision, dt.scale)
       case (dt: DecimalType, false) =>
         new NotNullDecimalConverter(dt.precision, dt.scale)
       case (MapType(k, v, vcn), true) =>
-        MapConverter(getConverterForType(k, nullable = false),
+        new MapConverter(getConverterForType(k, nullable = false),
           getConverterForType(v, vcn))
       case (MapType(k, v, vcn), false) =>
-        NotNullMapConverter(getConverterForType(k, nullable = false),
+        new NotNullMapConverter(getConverterForType(k, nullable = false),
           getConverterForType(v, vcn))
       case (NullType, true) =>
         NullConverter
@@ -394,7 +393,7 @@ private object GpuExternalRowToColumnConverter {
     ret + OFFSET
   }
 
-  private case class MapConverter(
+  private class MapConverter(
     keyConverter: TypeConverter,
     valueConverter: TypeConverter) extends TypeConverter {
     override def append(row: Row,
@@ -410,7 +409,7 @@ private object GpuExternalRowToColumnConverter {
     override def getNullSize: Double = VALIDITY_N_OFFSET
   }
 
-  private case class NotNullMapConverter(
+  private class NotNullMapConverter(
     keyConverter: TypeConverter,
     valueConverter: TypeConverter) extends TypeConverter {
     override def append(row: Row,
@@ -453,7 +452,7 @@ private object GpuExternalRowToColumnConverter {
     ret + OFFSET
   }
 
-  private case class ArrayConverter(childConverter: TypeConverter)
+  private class ArrayConverter(childConverter: TypeConverter)
     extends TypeConverter {
     override def append(row: Row,
       column: Int, builder: RapidsHostColumnBuilder): Double = {
@@ -468,7 +467,7 @@ private object GpuExternalRowToColumnConverter {
     override def getNullSize: Double = VALIDITY_N_OFFSET
   }
 
-  private case class NotNullArrayConverter(childConverter: TypeConverter)
+  private class NotNullArrayConverter(childConverter: TypeConverter)
     extends TypeConverter {
     override def append(row: Row,
       column: Int, builder: RapidsHostColumnBuilder): Double = {
@@ -492,7 +491,7 @@ private object GpuExternalRowToColumnConverter {
     ret
   }
 
-  private case class StructConverter(
+  private class StructConverter(
     childConverters: Array[TypeConverter]) extends TypeConverter {
     override def append(row: Row,
       column: Int,
@@ -509,7 +508,7 @@ private object GpuExternalRowToColumnConverter {
     override def getNullSize: Double = childConverters.map(_.getNullSize).sum + VALIDITY
   }
 
-  private case class NotNullStructConverter(
+  private class NotNullStructConverter(
     childConverters: Array[TypeConverter]) extends TypeConverter {
     override def append(row: Row,
       column: Int,
@@ -645,7 +644,11 @@ private class ExternalRowToColumnarIterator(
  * of GPU memory.  By convention it is the responsibility of the one consuming the data to close it
  * when they no longer need it.
  */
-object InternalColumnarRddConverter extends Logging {
+object InternalColumnarRddConverter {
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+
+  private def logDebug(msg: => String): Unit = if (log.isDebugEnabled) log.debug(msg)
+
   def apply(df: DataFrame): RDD[Table] = {
     convert(df)
   }
diff --git a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/ShuffledBatchRDD.scala b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/ShuffledBatchRDD.scala
index 34c99f40dd9..c1256631c86 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/ShuffledBatchRDD.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/ShuffledBatchRDD.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2020-2022, NVIDIA CORPORATION.
+ * Copyright (c) 2020-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -32,7 +32,8 @@ import org.apache.spark.sql.execution.metric.{SQLMetric, SQLShuffleReadMetricsRe
 import org.apache.spark.sql.internal.SQLConf
 import org.apache.spark.sql.vectorized.ColumnarBatch
 
-case class ShuffledBatchRDDPartition(index: Int, spec: ShufflePartitionSpec) extends Partition
+class ShuffledBatchRDDPartition(override val index: Int, val spec: ShufflePartitionSpec)
+  extends Partition
 
 /**
  * A dummy partitioner for use with records whose partition ids have been pre-computed (i.e. for
@@ -135,7 +136,7 @@ class ShuffledBatchRDD(
 
   override def getPartitions: Array[Partition] = {
     Array.tabulate[Partition](partitionSpecs.length) { i =>
-      ShuffledBatchRDDPartition(i, partitionSpecs(i))
+      new ShuffledBatchRDDPartition(i, partitionSpecs(i))
     }
   }
 
diff --git a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/TrampolineUtil.scala b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/TrampolineUtil.scala
index 538df0c9d61..71943859784 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/TrampolineUtil.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/TrampolineUtil.scala
@@ -18,8 +18,8 @@ package org.apache.spark.sql.rapids.execution
 
 import java.util.concurrent.{ExecutorService, ScheduledExecutorService, ThreadPoolExecutor}
 
+import org.apache.avro.Schema
 import org.apache.hadoop.conf.Configuration
-import org.json4s.JsonAST
 
 import org.apache.spark.{SparkConf, SparkContext, SparkEnv, SparkMasterRegex, SparkUpgradeException, TaskContext}
 import org.apache.spark.broadcast.Broadcast
@@ -40,7 +40,6 @@ import org.apache.spark.sql.internal.SQLConf
 import org.apache.spark.sql.rapids.GpuTaskMetrics
 import org.apache.spark.sql.rapids.shims.DataTypeUtilsShim
 import org.apache.spark.sql.rapids.shims.SparkUpgradeExceptionShims
-import org.apache.spark.sql.rapids.shims.TrampolineConnectShims
 import org.apache.spark.sql.types.{DataType, StructType}
 import org.apache.spark.storage.BlockManagerId
 import org.apache.spark.util.{ShutdownHookManager, ThreadUtils, Utils}
@@ -59,7 +58,23 @@ object TrampolineUtil {
   def toAttributes(structType: StructType): Seq[Attribute] =
     DataTypeUtilsShim.toAttributes(structType)
 
-  def jsonValue(dataType: DataType): JsonAST.JValue = dataType.jsonValue
+  private[this] lazy val dataTypeJsonValue = classOf[DataType].getMethod("jsonValue")
+
+  def jsonValue(dataType: DataType): AnyRef = dataTypeJsonValue.invoke(dataType)
+
+  private[this] lazy val trampolineConnectShims = Class
+    .forName("org.apache.spark.sql.rapids.shims.TrampolineConnectShims$")
+    .getField("MODULE$")
+    .get(null)
+
+  private[this] lazy val cleanupAnyExistingSessionMethod =
+    trampolineConnectShims.getClass.getMethod("cleanupAnyExistingSession")
+
+  private[this] lazy val createSchemaParserMethod =
+    trampolineConnectShims.getClass.getMethod("createSchemaParser")
+
+  def createSchemaParser(): Schema.Parser =
+    createSchemaParserMethod.invoke(trampolineConnectShims).asInstanceOf[Schema.Parser]
 
   /** Get a human-readable string, e.g.: "4.0 MiB", for a value in bytes. */
   def bytesToString(size: Long): String = Utils.bytesToString(size)
@@ -103,7 +118,8 @@ object TrampolineUtil {
   }
 
   /** Shuts down and cleans up any existing Spark session */
-  def cleanupAnyExistingSession(): Unit = TrampolineConnectShims.cleanupAnyExistingSession()
+  def cleanupAnyExistingSession(): Unit =
+    cleanupAnyExistingSessionMethod.invoke(trampolineConnectShims)
 
   def asNullable(dt: DataType): DataType = dt.asNullable
 
@@ -263,9 +279,87 @@ object TrampolineUtil {
 }
 
 /**
- * This class is to only be used to throw errors specific to the
- * RAPIDS Accelerator or errors mirroring Spark where a raw
- * AnalysisException is thrown directly rather than via an error
- * utility class (this should be rare).
+ * Factory for raw-message AnalysisExceptions where Spark has no error utility.
+ *
+ * The AnalysisException constructor is selected reflectively by parameter shape. The
+ * selection runs once, on first use, and is reused by every later call.
  */
-class RapidsAnalysisException(msg: String) extends AnalysisException(msg)
+object RapidsAnalysisException {
+  private type Ctor = java.lang.reflect.Constructor[_]
+
+  /** A resolved constructor plus the arguments that follow the message. */
+  private final class Resolved(val ctor: Ctor, val trailingArgs: Array[AnyRef])
+
+  // Resolved lazily, once: scanning the constructors on every call is wasted work
+  // because the set of constructors cannot change while the class is loaded.
+  private lazy val resolved: Resolved = {
+    val ctors = classOf[AnalysisException].getConstructors
+    // Preference order: 7-arg Map/QueryContext, then 8-arg Map/QueryContext,
+    // then the 7-arg shape that ends in Array[String].
+    mapAndContextCtor(ctors, 7)
+      .orElse(mapAndContextCtor(ctors, 8))
+      .orElse(stringParametersCtor(ctors))
+      .getOrElse {
+        throw new IllegalStateException("Unsupported AnalysisException constructor shape")
+      }
+  }
+
+  /**
+   * Creates an AnalysisException carrying only `msg`.
+   *
+   * @throws IllegalStateException if no known constructor shape is found
+   */
+  def apply(msg: String): AnalysisException = {
+    val args = Array[AnyRef](msg) ++ resolved.trailingArgs
+    resolved.ctor.newInstance(args: _*).asInstanceOf[AnalysisException]
+  }
+
+  /**
+   * Matches a public constructor with `arity` parameters that starts with a String and ends
+   * with an immutable Map followed by an Array[QueryContext]. Every parameter in between is
+   * filled with None.
+   */
+  private def mapAndContextCtor(ctors: Array[Ctor], arity: Int): Option[Resolved] = {
+    ctors.find { ctor =>
+      val params = ctor.getParameterTypes
+      params.length == arity &&
+        params(0) == classOf[String] &&
+        params(arity - 2).getName == "scala.collection.immutable.Map" &&
+        isQueryContextArray(params(arity - 1))
+    }.map { ctor =>
+      // Build the empty array from the parameter's own component type so that no second
+      // class lookup by name is needed.
+      val contextArray = emptyArrayOf(ctor.getParameterTypes.last)
+      new Resolved(ctor,
+        nones(arity - 3) ++ Array[AnyRef](Map.empty[String, String], contextArray))
+    }
+  }
+
+  /**
+   * Matches the public 7-parameter constructor that starts with a String and ends with an
+   * Array[String]. The five parameters in between are filled with None.
+   */
+  private def stringParametersCtor(ctors: Array[Ctor]): Option[Resolved] = {
+    ctors.find { ctor =>
+      val params = ctor.getParameterTypes
+      params.length == 7 &&
+        params(0) == classOf[String] &&
+        params(6).isArray &&
+        params(6).getComponentType == classOf[String]
+    }.map { ctor =>
+      new Resolved(ctor, nones(5) ++ Array[AnyRef](Array.empty[String]))
+    }
+  }
+
+  /** `count` copies of None, typed for a reflective argument list. */
+  private def nones(count: Int): Array[AnyRef] = Array.fill[AnyRef](count)(None)
+
+  private def isQueryContextArray(cls: Class[_]): Boolean = {
+    cls.isArray && cls.getComponentType.getName == "org.apache.spark.QueryContext"
+  }
+
+  /** A zero-length array whose element type is that of `arrayClass`. */
+  private def emptyArrayOf(arrayClass: Class[_]): AnyRef = {
+    java.lang.reflect.Array.newInstance(arrayClass.getComponentType, 0)
+  }
+}
diff --git a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/python/BatchGroupUtils.scala b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/python/BatchGroupUtils.scala
index 5baa2974f53..97ab778ce50 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/python/BatchGroupUtils.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/python/BatchGroupUtils.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2021-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2021-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -41,10 +41,10 @@ import org.apache.spark.sql.vectorized.ColumnarBatch
  *                   and data columns by the Python workers.
  * @param groupingOffsets the grouping offsets(aka column indices) in the deduplicated attributes.
  */
-case class GroupArgs(
-    dedupAttrs: Seq[Attribute],
-    argOffsets: Array[Int],
-    groupingOffsets: Seq[Int])
+class GroupArgs(
+    val dedupAttrs: Seq[Attribute],
+    val argOffsets: Array[Int],
+    val groupingOffsets: Seq[Int]) extends Serializable // as the former case class was
 
 /**
  * Basic functionality to deal with groups in a batch.
@@ -138,7 +138,7 @@ private[python] object BatchGroupUtils {
     val argOffsets = Array(argOffsetLen, groupingAttrs.length) ++
       groupingArgOffsets ++ dataAttrs.indices
 
-    GroupArgs(dedupAttrs, argOffsets, groupingArgOffsets)
+    new GroupArgs(dedupAttrs, argOffsets, groupingArgOffsets)
   }
 
   /**
diff --git a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/python/GpuAggregateInPandasExec.scala b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/python/GpuAggregateInPandasExec.scala
index c791ce3292a..3cb30cb1ce1 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/python/GpuAggregateInPandasExec.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/python/GpuAggregateInPandasExec.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2020-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2020-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -116,6 +116,9 @@ case class GpuAggregateInPandasExec(
     // Filter child output attributes down to only those that are UDF inputs.
     // Also eliminate duplicate UDF inputs.
     val udfArgs = PythonArgumentUtils.flatten(inputs)
+    val udfFlattenedArgs = udfArgs.flattenedArgs
+    val udfArgOffsets = udfArgs.argOffsets
+    val udfArgNames = udfArgs.argNames
 
     // Schema of input rows to the python runner
     val aggInputSchema = StructType(udfArgs.flattenedTypes.zipWithIndex.map { case (dt, i) =>
@@ -136,7 +139,7 @@ case class GpuAggregateInPandasExec(
       // Doing this can reduce the data size to be split, probably getting a better performance.
       val groupingRefs = GpuBindReferences.bindGpuReferences(gpuGroupingExpressions,
         childOutput, allMetrics)
-      val pyInputRefs = GpuBindReferences.bindGpuReferences(udfArgs.flattenedArgs,
+      val pyInputRefs = GpuBindReferences.bindGpuReferences(udfFlattenedArgs,
         childOutput, allMetrics)
       val miniIter = inputIter.map { batch =>
         mNumInputBatches += 1
@@ -148,7 +151,7 @@ case class GpuAggregateInPandasExec(
 
       // Second splits into separate group batches.
       val miniAttrs =
-        (gpuGroupingExpressions ++ udfArgs.flattenedArgs).asInstanceOf[Seq[Attribute]]
+        (gpuGroupingExpressions ++ udfFlattenedArgs).asInstanceOf[Seq[Attribute]]
       val keyConverter = (groupedBatch: ColumnarBatch) => {
         // No `safeMap` because here does not increase the ref count.
         // (`Seq.indices.map()` is NOT lazy, so it is safe to be used to slice the columns.)
@@ -191,9 +194,9 @@ case class GpuAggregateInPandasExec(
         }
       }
 
-      val runnerFactory = GpuGroupedPythonRunnerFactory(conf, pyFuncs, udfArgs.argOffsets,
+      val runnerFactory = new GpuGroupedPythonRunnerFactory(conf, pyFuncs, udfArgOffsets,
         aggInputSchema, DataTypeUtilsShim.fromAttributes(pyOutAttributes),
-        PythonEvalType.SQL_GROUPED_AGG_PANDAS_UDF, udfArgs.argNames)
+        PythonEvalType.SQL_GROUPED_AGG_PANDAS_UDF, udfArgNames)
 
       // Third, sends to Python to execute the aggregate and returns the result.
       if (pyInputIter.hasNext) {
diff --git a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/python/GpuFlatMapCoGroupsInPandasExec.scala b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/python/GpuFlatMapCoGroupsInPandasExec.scala
index e4515b40662..968df9dc747 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/python/GpuFlatMapCoGroupsInPandasExec.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/python/GpuFlatMapCoGroupsInPandasExec.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2020-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2020-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -138,10 +138,14 @@ case class GpuFlatMapCoGroupsInPandasExec(
       StructField("out_struct", DataTypeUtilsShim.fromAttributes(output)) :: Nil)
 
     // Resolve the argument offsets and related attributes.
-    val GroupArgs(leftDedupAttrs, leftArgOffsets, leftGroupingOffsets) =
-      resolveArgOffsets(left, leftGroup)
-    val GroupArgs(rightDedupAttrs, rightArgOffsets, rightGroupingOffsets) =
-      resolveArgOffsets(right, rightGroup)
+    val leftGroupArgs = resolveArgOffsets(left, leftGroup)
+    val leftDedupAttrs = leftGroupArgs.dedupAttrs
+    val leftArgOffsets = leftGroupArgs.argOffsets
+    val leftGroupingOffsets = leftGroupArgs.groupingOffsets
+    val rightGroupArgs = resolveArgOffsets(right, rightGroup)
+    val rightDedupAttrs = rightGroupArgs.dedupAttrs
+    val rightArgOffsets = rightGroupArgs.argOffsets
+    val rightGroupingOffsets = rightGroupArgs.groupingOffsets
 
     left.executeColumnar().zipPartitions(right.executeColumnar())  { (leftIter, rightIter) =>
       if (isPythonOnGpuEnabled) {
diff --git a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/python/GpuFlatMapGroupsInPandasExec.scala b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/python/GpuFlatMapGroupsInPandasExec.scala
index 27dd4ae65ba..2d69892d988 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/python/GpuFlatMapGroupsInPandasExec.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/python/GpuFlatMapGroupsInPandasExec.scala
@@ -119,12 +119,14 @@ case class GpuFlatMapGroupsInPandasExec(
         StructField("out_struct", DataTypeUtilsShim.fromAttributes(localOutput)) :: Nil)
 
     // Resolve the argument offsets and related attributes.
-    val GroupArgs(dedupAttrs, argOffsets, groupingOffsets) =
-        resolveArgOffsets(child, groupingAttributes)
+    val groupArgs = resolveArgOffsets(child, groupingAttributes)
+    val dedupAttrs = groupArgs.dedupAttrs
+    val argOffsets = groupArgs.argOffsets
+    val groupingOffsets = groupArgs.groupingOffsets
 
-    val runnerFactory = GpuGroupedPythonRunnerFactory(conf, chainedFunc, Array(argOffsets),
+    val runnerFactory = new GpuGroupedPythonRunnerFactory(conf, chainedFunc, Array(argOffsets),
         DataTypeUtilsShim.fromAttributes(dedupAttrs), pythonOutputSchema,
-        udf.evalType)
+        udf.evalType, None)
 
     // Start processing. Map grouped batches to ArrowPythonRunner results.
     child.executeColumnar().mapPartitionsInternal { inputIter =>
diff --git a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/python/GpuPythonHelper.scala b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/python/GpuPythonHelper.scala
index 56da226495a..7f6c780d33a 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/python/GpuPythonHelper.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/python/GpuPythonHelper.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2020-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2020-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -22,12 +22,26 @@ import com.nvidia.spark.rapids.python.PythonConfEntries._
 
 import org.apache.spark.{SparkConf, SparkEnv}
 import org.apache.spark.api.python.ChainedPythonFunctions
-import org.apache.spark.internal.Logging
 import org.apache.spark.internal.config.{CPUS_PER_TASK, EXECUTOR_CORES}
 import org.apache.spark.internal.config.Python._
 import org.apache.spark.sql.internal.SQLConf
 
-object GpuPythonHelper extends Logging {
+object GpuPythonHelper {
+
+  // Name the logger without the object's trailing "$", as Spark's Logging trait does.
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+
+  private def logWarning(msg: => String): Unit = {
+    if (log.isWarnEnabled) {
+      log.warn(msg)
+    }
+  }
+
+  private def logDebug(msg: => String): Unit = {
+    if (log.isDebugEnabled) {
+      log.debug(msg)
+    }
+  }
 
   private val sparkConf = SparkEnv.get.conf
   private lazy val rapidsConf = new RapidsConf(sparkConf)
diff --git a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/python/GpuPythonUDF.scala b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/python/GpuPythonUDF.scala
index 04367d9f29f..d0cbc26e26d 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/python/GpuPythonUDF.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/execution/python/GpuPythonUDF.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2021-2024, NVIDIA CORPORATION.
+ * Copyright (c) 2021-2026, NVIDIA CORPORATION.
  *
  * Licensed to the Apache Software Foundation (ASF) under one or more
  * contributor license agreements.  See the NOTICE file distributed with
diff --git a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/predicates.scala b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/predicates.scala
index fb956738e18..f6f961f540b 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/predicates.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/predicates.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2019-2024, NVIDIA CORPORATION.
+ * Copyright (c) 2019-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -20,7 +20,7 @@ import ai.rapids.cudf._
 import ai.rapids.cudf.ast.BinaryOperator
 import com.nvidia.spark.rapids._
 import com.nvidia.spark.rapids.Arm.withResource
-import com.nvidia.spark.rapids.shims.NullIntolerantShim
+import com.nvidia.spark.rapids.shims.{NullIntolerantShim, ShimPredicate}
 
 import org.apache.spark.sql.catalyst.analysis.TypeCheckResult
 import org.apache.spark.sql.catalyst.expressions._
@@ -30,7 +30,7 @@ import org.apache.spark.sql.vectorized.ColumnarBatch
 
 
 case class GpuNot(child: Expression) extends CudfUnaryExpression
-    with Predicate with ImplicitCastInputTypes with NullIntolerantShim {
+    with ShimPredicate with ImplicitCastInputTypes with NullIntolerantShim {
   override def toString: String = s"NOT $child"
 
   override def inputTypes: Seq[DataType] = Seq(BooleanType)
@@ -51,7 +51,7 @@ case class GpuNot(child: Expression) extends CudfUnaryExpression
   }
 }
 
-abstract class CudfBinaryPredicateWithSideEffect extends CudfBinaryOperator with Predicate {
+abstract class CudfBinaryPredicateWithSideEffect extends CudfBinaryOperator with ShimPredicate {
 
   override def inputType: AbstractDataType = BooleanType
 
@@ -152,7 +152,7 @@ case class GpuOr(left: Expression, right: Expression) extends CudfBinaryPredicat
     GpuExpressionWithSideEffectUtils.boolInverted(col)
 }
 
-abstract class CudfBinaryComparison extends CudfBinaryOperator with Predicate {
+abstract class CudfBinaryComparison extends CudfBinaryOperator with ShimPredicate {
   // Note that we need to give a superset of allowable input types since orderable types are not
   // finitely enumerable. The allowable types are checked below by checkInputDataTypes.
   override def inputType: AbstractDataType = AnyDataType
diff --git a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/shims/RapidsQueryErrorUtils.scala b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/shims/RapidsQueryErrorUtils.scala
index 5ac79327380..cc5121655ca 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/shims/RapidsQueryErrorUtils.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/shims/RapidsQueryErrorUtils.scala
@@ -96,6 +96,6 @@ trait RapidsQueryErrorUtils {
   }
 
   def dynamicPartitionParentError: Throwable = {
-    throw new RapidsAnalysisException(ErrorMsg.PARTITION_DYN_STA_ORDER.getMsg)
+    throw RapidsAnalysisException(ErrorMsg.PARTITION_DYN_STA_ORDER.getMsg)
   }
 }
diff --git a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/stringFunctions.scala b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/stringFunctions.scala
index 2b146a07cee..09d2f5db33b 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/stringFunctions.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/stringFunctions.scala
@@ -34,7 +34,7 @@ import com.nvidia.spark.rapids.jni.CharsetDecode
 import com.nvidia.spark.rapids.jni.GpuSubstringIndexUtils
 import com.nvidia.spark.rapids.jni.NumberConverter
 import com.nvidia.spark.rapids.jni.RegexRewriteUtils
-import com.nvidia.spark.rapids.shims.{NullIntolerantShim, ShimExpression, SparkShimImpl}
+import com.nvidia.spark.rapids.shims.{NullIntolerantShim, ShimExpression, ShimPredicate, SparkShimImpl}
 
 import org.apache.spark.sql.catalyst.expressions._
 import org.apache.spark.sql.errors.ConvUtils
@@ -163,7 +163,7 @@ case class GpuStringLocate(substr: Expression, col: Expression, start: Expressio
 
 case class GpuStartsWith(left: Expression, right: Expression)
   extends GpuBinaryExpressionArgsAnyScalar
-      with Predicate
+      with ShimPredicate
       with ImplicitCastInputTypes
       with NullIntolerantShim {
 
@@ -189,7 +189,7 @@ case class GpuStartsWith(left: Expression, right: Expression)
 
 case class GpuEndsWith(left: Expression, right: Expression)
   extends GpuBinaryExpressionArgsAnyScalar
-      with Predicate
+      with ShimPredicate
       with ImplicitCastInputTypes
       with NullIntolerantShim {
 
@@ -396,7 +396,7 @@ case class GpuConcatWs(children: Seq[Expression])
 
 case class GpuContains(left: Expression, right: Expression)
     extends GpuBinaryExpression
-        with Predicate
+        with ShimPredicate
         with ImplicitCastInputTypes
         with NullIntolerantShim
         with GpuCombinable {
@@ -496,7 +496,7 @@ class ContainsCombiner(private val exp: GpuContains) extends GpuExpressionCombin
   override def addExpression(e: Expression): Unit = {
     val localOutputLocation = outputLocation
     outputLocation += 1
-    val key = GpuExpressionEquals(e)
+    val key = new GpuExpressionEquals(e)
     if (!toCombine.contains(key)) {
       toCombine.put(key, localOutputLocation)
     }
@@ -530,7 +530,7 @@ class ContainsCombiner(private val exp: GpuContains) extends GpuExpressionCombin
   }
 
   override def getReplacementExpression(e: Expression): Option[Expression] = {
-    toCombine.get(GpuExpressionEquals(e)).map { localId =>
+    toCombine.get(new GpuExpressionEquals(e)).map { localId =>
       GpuGetStructField(multiContains, localId, Some(fieldName(localId)))
     }
   }
diff --git a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/test/cpuJsonExpressions.scala b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/test/cpuJsonExpressions.scala
index 0dd048967a8..60e738e4c6f 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/test/cpuJsonExpressions.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/test/cpuJsonExpressions.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2024, NVIDIA CORPORATION.
+ * Copyright (c) 2024-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -34,7 +34,8 @@ import org.apache.spark.sql.catalyst.expressions.{GetJsonObject, Literal}
 import org.apache.spark.sql.types.StringType
 import org.apache.spark.unsafe.types.UTF8String
 
-case class CsvWriterWrapper(filePath: String, conf: Configuration) extends AutoCloseable {
+class CsvWriterWrapper(val filePath: String, val conf: Configuration) extends AutoCloseable
+    with Serializable {
 
   // This is implemented as a method to make it easier to subclass
   // ColumnarOutputWriter in the tests, and override this behavior.
@@ -262,7 +263,7 @@ object CpuGetJsonObject {
         val date = DateTimeFormatter.ofPattern("yyyyMMdd").format(LocalDate.now())
         val uuid = UUID.randomUUID()
         val savePath = s"$savePathForVerify/${date}_${tcId}_${uuid}.csv"
-        withResource(CsvWriterWrapper(savePath, conf)) { csvWriter =>
+        withResource(new CsvWriterWrapper(savePath, conf)) { csvWriter =>
           val pathStr = if (path == null) "null" else path.toString
           var currRow = 0
           var diffRowsNum = 0
diff --git a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/zorder/ZOrderRules.scala b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/zorder/ZOrderRules.scala
index bb56e8a7602..d4e342188f7 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/zorder/ZOrderRules.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/sql/rapids/zorder/ZOrderRules.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2022-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2022-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -97,7 +97,7 @@ object ZOrderRules {
           TypeSig.BINARY,
           TypeSig.BINARY,
           repeatingParamCheck =
-            Some(RepeatingParamCheck("input",
+            Some(new RepeatingParamCheck("input",
               TypeSig.INT,
               TypeSig.INT))),
         (a, conf, p, r) => new ExprMeta[Expression](a, conf, p, r) {
@@ -129,7 +129,7 @@ object ZOrderRules {
           TypeSig.LONG,
           TypeSig.LONG,
           repeatingParamCheck =
-            Some(RepeatingParamCheck("input",
+            Some(new RepeatingParamCheck("input",
               TypeSig.INT,
               TypeSig.INT))),
         (a, conf, p, r) => new ExprMeta[Expression](a, conf, p, r) {
diff --git a/sql-plugin/src/main/scala/org/apache/spark/storage/RapidsPushBasedFetchHelper.scala b/sql-plugin/src/main/scala/org/apache/spark/storage/RapidsPushBasedFetchHelper.scala
index 18f53e74060..7945d28dbc2 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/storage/RapidsPushBasedFetchHelper.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/storage/RapidsPushBasedFetchHelper.scala
@@ -27,7 +27,6 @@ import org.roaringbitmap.RoaringBitmap
 
 import org.apache.spark.MapOutputTracker
 import org.apache.spark.MapOutputTracker.SHUFFLE_PUSH_MAP_ID
-import org.apache.spark.internal.Logging
 import org.apache.spark.network.shuffle.{BlockStoreClient, MergedBlockMeta, MergedBlocksMetaListener}
 import org.apache.spark.storage.BlockManagerId.SHUFFLE_MERGER_IDENTIFIER
 import org.apache.spark.storage.RapidsShuffleBlockFetcherIterator._
@@ -52,7 +51,39 @@ private class RapidsPushBasedFetchHelper(
    private val iterator: RapidsShuffleBlockFetcherIterator,
    private val shuffleClient: BlockStoreClient,
    private val blockManager: BlockManager,
-   private val mapOutputTracker: MapOutputTracker) extends Logging {
+   private val mapOutputTracker: MapOutputTracker) {
+
+  private val log = org.slf4j.LoggerFactory.getLogger(classOf[RapidsPushBasedFetchHelper])
+
+  private def logInfo(msg: => String): Unit = {
+    if (log.isInfoEnabled) {
+      log.info(msg)
+    }
+  }
+
+  private def logWarning(msg: => String): Unit = {
+    if (log.isWarnEnabled) {
+      log.warn(msg)
+    }
+  }
+
+  private def logWarning(msg: => String, throwable: Throwable): Unit = {
+    if (log.isWarnEnabled) {
+      log.warn(msg, throwable)
+    }
+  }
+
+  private def logDebug(msg: => String): Unit = {
+    if (log.isDebugEnabled) {
+      log.debug(msg)
+    }
+  }
+
+  private def logError(msg: => String, throwable: Throwable): Unit = {
+    if (log.isErrorEnabled) {
+      log.error(msg, throwable)
+    }
+  }
 
   private[this] val startTimeNs = System.nanoTime()
 
diff --git a/sql-plugin/src/main/scala/org/apache/spark/storage/RapidsShuffleBlockFetcherIterator.scala b/sql-plugin/src/main/scala/org/apache/spark/storage/RapidsShuffleBlockFetcherIterator.scala
index eb48fc3afdb..a33094fdb63 100644
--- a/sql-plugin/src/main/scala/org/apache/spark/storage/RapidsShuffleBlockFetcherIterator.scala
+++ b/sql-plugin/src/main/scala/org/apache/spark/storage/RapidsShuffleBlockFetcherIterator.scala
@@ -33,7 +33,7 @@ import org.roaringbitmap.RoaringBitmap
 import org.apache.spark.{MapOutputTracker, SparkEnv, TaskContext}
 import org.apache.spark.MapOutputTracker.SHUFFLE_PUSH_MAP_ID
 import org.apache.spark.SparkException
-import org.apache.spark.internal.{config, Logging}
+import org.apache.spark.internal.config
 import org.apache.spark.network.buffer.{FileSegmentManagedBuffer, ManagedBuffer}
 import org.apache.spark.network.shuffle._
 import org.apache.spark.network.shuffle.checksum.{Cause, ShuffleChecksumHelper}
@@ -115,7 +115,51 @@ final class RapidsShuffleBlockFetcherIterator(
     checksumAlgorithm: String,
     shuffleMetrics: ShuffleReadMetricsReporter,
     doBatchFetch: Boolean)
-  extends Iterator[(BlockId, InputStream)] with DownloadFileManager with Logging {
+  extends Iterator[(BlockId, InputStream)] with DownloadFileManager {
+
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+
+  private def logInfo(msg: => String): Unit = {
+    if (log.isInfoEnabled) {
+      log.info(msg)
+    }
+  }
+
+  private def logWarning(msg: => String): Unit = {
+    if (log.isWarnEnabled) {
+      log.warn(msg)
+    }
+  }
+
+  private def logWarning(msg: => String, throwable: Throwable): Unit = {
+    if (log.isWarnEnabled) {
+      log.warn(msg, throwable)
+    }
+  }
+
+  private def logDebug(msg: => String): Unit = {
+    if (log.isDebugEnabled) {
+      log.debug(msg)
+    }
+  }
+
+  private def logTrace(msg: => String): Unit = {
+    if (log.isTraceEnabled) {
+      log.trace(msg)
+    }
+  }
+
+  private def logError(msg: => String): Unit = {
+    if (log.isErrorEnabled) {
+      log.error(msg)
+    }
+  }
+
+  private def logError(msg: => String, throwable: Throwable): Unit = {
+    if (log.isErrorEnabled) {
+      log.error(msg, throwable)
+    }
+  }
 
   import RapidsShuffleBlockFetcherIterator._
 
diff --git a/sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/CastTimeToIntShim.scala b/sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/CastTimeToIntShim.scala
deleted file mode 100644
index 6aee8860df3..00000000000
--- a/sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/CastTimeToIntShim.scala
+++ /dev/null
@@ -1,47 +0,0 @@
-/*
- * Copyright (c) 2025-2026, NVIDIA CORPORATION.
- *
- * Licensed under the Apache License, Version 2.0 (the "License");
- * you may not use this file except in compliance with the License.
- * You may obtain a copy of the License at
- *
- *     http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-
-/*** spark-rapids-shim-json-lines
-{"spark": "330"}
-{"spark": "330db"}
-{"spark": "331"}
-{"spark": "332"}
-{"spark": "332db"}
-{"spark": "333"}
-{"spark": "334"}
-{"spark": "340"}
-{"spark": "341"}
-{"spark": "341db"}
-{"spark": "342"}
-{"spark": "343"}
-{"spark": "344"}
-{"spark": "350"}
-{"spark": "351"}
-{"spark": "352"}
-{"spark": "353"}
-{"spark": "354"}
-{"spark": "355"}
-{"spark": "356"}
-{"spark": "357"}
-{"spark": "358"}
-spark-rapids-shim-json-lines ***/
-package com.nvidia.spark.rapids.shims
-
-object CastTimeToIntShim {
-  // Whether to set overflow rows to nulls when casting timestamps to integrals,
-  // when ANSI is disabled.
-  def ifNullifyOverflows: Boolean = false
-}
diff --git a/sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/DateTimeUtilsShims.scala b/sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/DateTimeUtilsShims.scala
deleted file mode 100644
index 5665626023b..00000000000
--- a/sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/DateTimeUtilsShims.scala
+++ /dev/null
@@ -1,48 +0,0 @@
-/*
- * Copyright (c) 2024-2026, NVIDIA CORPORATION.
- *
- * Licensed under the Apache License, Version 2.0 (the "License");
- * you may not use this file except in compliance with the License.
- * You may obtain a copy of the License at
- *
- *     http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-
-/*** spark-rapids-shim-json-lines
-{"spark": "330"}
-{"spark": "330db"}
-{"spark": "331"}
-{"spark": "332"}
-{"spark": "332db"}
-{"spark": "333"}
-{"spark": "334"}
-{"spark": "340"}
-{"spark": "341"}
-{"spark": "341db"}
-{"spark": "342"}
-{"spark": "343"}
-{"spark": "344"}
-{"spark": "350"}
-{"spark": "350db143"}
-{"spark": "351"}
-{"spark": "352"}
-{"spark": "353"}
-{"spark": "354"}
-{"spark": "355"}
-{"spark": "356"}
-{"spark": "357"}
-{"spark": "358"}
-spark-rapids-shim-json-lines ***/
-package com.nvidia.spark.rapids.shims
-
-import org.apache.spark.sql.catalyst.util.DateTimeUtils
-
-object DateTimeUtilsShims {
-  def currentTimestamp: Long = DateTimeUtils.currentTimestamp()
-}
diff --git a/sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/GetJsonObjectShim.scala b/sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/GetJsonObjectShim.scala
deleted file mode 100644
index f0dea3c6ab6..00000000000
--- a/sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/GetJsonObjectShim.scala
+++ /dev/null
@@ -1,57 +0,0 @@
-/*
- * Copyright (c) 2025-2026, NVIDIA CORPORATION.
- *
- * Licensed under the Apache License, Version 2.0 (the "License");
- * you may not use this file except in compliance with the License.
- * You may obtain a copy of the License at
- *
- *     http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-
-/*** spark-rapids-shim-json-lines
-{"spark": "330"}
-{"spark": "330db"}
-{"spark": "331"}
-{"spark": "332"}
-{"spark": "332db"}
-{"spark": "333"}
-{"spark": "334"}
-{"spark": "340"}
-{"spark": "341"}
-{"spark": "341db"}
-{"spark": "342"}
-{"spark": "343"}
-{"spark": "344"}
-{"spark": "350"}
-{"spark": "350db143"}
-{"spark": "351"}
-{"spark": "352"}
-{"spark": "353"}
-{"spark": "354"}
-{"spark": "355"}
-{"spark": "356"}
-{"spark": "357"}
-{"spark": "358"}
-spark-rapids-shim-json-lines ***/
-package com.nvidia.spark.rapids.shims
-
-object GetJsonObjectShim {
-  /**
-   * Return a shim string for a part in named Regexp.
-   * For Spark versions before 400, named Regexp is:
-   *   name <- '.' ~> "[^\\.\\[]+".r | "['" ~> "[^\\'\\?]+".r <~ "']"
-   * For Spark versions 400 and 400+, named Regexp is:
-   *   name <- '.' ~> "[^\\.\\[]+".r | "['" ~> "[^\\']+".r <~ "']"
-   * This is the shim to distinct "[^\\'\\?]+" and "[^\\']+"
-   *
-   * "[^\\'\\?]+" : One or more chars which are not: ' or ?
-   * "[^\\']+"    : One or more chars which are not: '
-   */
-  def partRegexpInNamed: String = "[^\\'\\?]+"
-}
diff --git a/sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/LegacyBehaviorPolicyShim.scala b/sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/LegacyBehaviorPolicyShim.scala
index 4f7be08da15..4718765a0c5 100644
--- a/sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/LegacyBehaviorPolicyShim.scala
+++ b/sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/LegacyBehaviorPolicyShim.scala
@@ -32,13 +32,14 @@ spark-rapids-shim-json-lines ***/
 package com.nvidia.spark.rapids.shims
 
 import org.apache.spark.sql.internal.SQLConf
-import org.apache.spark.sql.internal.SQLConf.LegacyBehaviorPolicy
 
+// Keep executable line numbers aligned with the newer shim so binary-dedupe
+// can recognize the common module class.
 object LegacyBehaviorPolicyShim {
-  val CORRECTED_STR: String =  LegacyBehaviorPolicy.CORRECTED.toString
-  val EXCEPTION_STR: String =  LegacyBehaviorPolicy.EXCEPTION.toString
+  val CORRECTED_STR: String = "CORRECTED"
+  val EXCEPTION_STR: String = "EXCEPTION"
 
   def isLegacyTimeParserPolicy(): Boolean = {
-    SQLConf.get.legacyTimeParserPolicy == LegacyBehaviorPolicy.LEGACY
+    SQLConf.get.legacyTimeParserPolicy.toString == "LEGACY"
   }
-}
\ No newline at end of file
+}
diff --git a/sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/NullIntolerantShim.scala b/sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/NullIntolerantShim.scala
index 3e5748682a0..6af4f2dc104 100644
--- a/sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/NullIntolerantShim.scala
+++ b/sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/NullIntolerantShim.scala
@@ -43,4 +43,27 @@ package com.nvidia.spark.rapids.shims
 
 import org.apache.spark.sql.catalyst.expressions.NullIntolerant
 
-trait NullIntolerantShim extends NullIntolerant
+trait NullIntolerantShim extends NullIntolerant {
+  def nullIntolerant: Boolean = true
+}
+
+abstract class GpuLiteralShim extends com.nvidia.spark.rapids.GpuLeafExpression {
+  def value: Any
+  def dataType: org.apache.spark.sql.types.DataType
+
+  override protected def jsonFields: List[org.json4s.JsonAST.JField] = {
+    val jsonValue = (value, dataType) match {
+      case (null, _) => org.json4s.JsonAST.JNull
+      case (i: Int, org.apache.spark.sql.types.DateType) =>
+        org.json4s.JsonAST.JString(
+          org.apache.spark.sql.catalyst.util.DateTimeUtils.toJavaDate(i).toString)
+      case (l: Long, org.apache.spark.sql.types.TimestampType) =>
+        org.json4s.JsonAST.JString(
+          org.apache.spark.sql.catalyst.util.DateTimeUtils.toJavaTimestamp(l).toString)
+      case (other, _) => org.json4s.JsonAST.JString(other.toString)
+    }
+    ("value" -> jsonValue) ::
+      ("dataType" -> org.apache.spark.sql.rapids.execution.TrampolineUtil.jsonValue(dataType)
+        .asInstanceOf[org.json4s.JsonAST.JValue]) :: Nil
+  }
+}
diff --git a/sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/NullOutputStreamShim.scala b/sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/NullOutputStreamShim.scala
index c4c4cbebbbd..85552b9b408 100644
--- a/sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/NullOutputStreamShim.scala
+++ b/sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/NullOutputStreamShim.scala
@@ -31,8 +31,13 @@
 spark-rapids-shim-json-lines ***/
 package com.nvidia.spark.rapids.shims
 
-import org.apache.commons.io.output.NullOutputStream
+import java.io.OutputStream
+
+// Keep executable line numbers aligned with newer shims for binary-dedupe.
 
 object NullOutputStreamShim {
-  def INSTANCE = NullOutputStream.NULL_OUTPUT_STREAM
+  val INSTANCE: OutputStream = new OutputStream {
+    override def write(b: Int): Unit = {}
+    override def write(b: Array[Byte], off: Int, len: Int): Unit = {}
+  }
 }
diff --git a/sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/OrcProtoWriterShim.scala b/sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/OrcProtoWriterShim.scala
index 225429ec697..5d379ef3b59 100644
--- a/sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/OrcProtoWriterShim.scala
+++ b/sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/OrcProtoWriterShim.scala
@@ -23,25 +23,85 @@
 {"spark": "333"}
 {"spark": "334"}
 spark-rapids-shim-json-lines ***/
+// Keep executable line numbers aligned with newer shims for binary-dedupe.
+
+
+
+
+
+
+
+
+
+
+
+
+
+
 package com.nvidia.spark.rapids.shims
 
-import com.google.protobuf.{AbstractMessage, CodedOutputStream}
+import java.io.OutputStream
+import java.lang.reflect.Method
+
 import org.apache.orc.impl.OutStream
 
 class OrcProtoWriterShim(orcOutStream: OutStream) {
-  val proxied = CodedOutputStream.newInstance(orcOutStream)
-  def writeAndFlush(obj: Any): Unit = obj match {
-    case m: AbstractMessage =>
-      m.writeTo(proxied)
-      proxied.flush()
-      orcOutStream.flush()
-    case _ =>
-      require(obj.isInstanceOf[AbstractMessage],
-        s"Unexpected protobuf message type: $obj")
+  import OrcProtoWriterShim.ProtoApi
+
+  private[this] var proxiedApi: ProtoApi = _
+  private[this] var proxied: AnyRef = _
+  // Returns the coded output stream for `api`, creating a new one only when `api` changes.
+  private def proxiedFor(api: ProtoApi): AnyRef = {
+    if (proxiedApi != api) {
+      proxiedApi = api // remember which API the cached stream belongs to
+      proxied = api.newInstance.invoke(null, orcOutStream.asInstanceOf[OutputStream])
+    }
+    proxied
+  }
+  // Reflectively writes `obj` and flushes the coded stream, then flushes the ORC stream.
+  def writeAndFlush(obj: Any): Unit = {
+    val api = OrcProtoWriterShim.apiFor(obj).getOrElse { // keeps the old require() text
+      throw new IllegalArgumentException(
+        s"requirement failed: Unexpected protobuf message type: $obj")
+    }
+    val currentProxied = proxiedFor(api)
+    api.writeTo.invoke(obj.asInstanceOf[AnyRef], currentProxied)
+    api.flush.invoke(currentProxied) // invoke() wraps failures in InvocationTargetException
+    orcOutStream.flush()
   }
 }
 
 object OrcProtoWriterShim {
+  private case class ProtoApi( // reflective handles for one protobuf package
+      messageClass: Class[_], // the package's AbstractMessage class
+      newInstance: Method, // CodedOutputStream.newInstance(OutputStream)
+      writeTo: Method, // messageClass.writeTo(CodedOutputStream)
+      flush: Method) // CodedOutputStream.flush()
+  // (message class, coded stream class) name pairs, listed in the order they are probed.
+  private val protoClassNames = Seq(
+    ("org.apache.orc.protobuf.AbstractMessage",
+      "org.apache.orc.protobuf.CodedOutputStream"),
+    ("com.google.protobuf.AbstractMessage",
+      "com.google.protobuf.CodedOutputStream"))
+  // Resolved lazily on first use; a pair is dropped when a class or method lookup fails.
+  private lazy val protoApis: Seq[ProtoApi] = protoClassNames.flatMap { case (msg, out) =>
+    try {
+      val messageClass = Class.forName(msg)
+      val codedOutputStreamClass = Class.forName(out)
+      Some(ProtoApi(
+        messageClass,
+        codedOutputStreamClass.getMethod("newInstance", classOf[OutputStream]),
+        messageClass.getMethod("writeTo", codedOutputStreamClass),
+        codedOutputStreamClass.getMethod("flush")))
+    } catch {
+      case _: ReflectiveOperationException => None // class or method not present
+    }
+  }
+  // First resolved API whose message class `obj` is an instance of, or None.
+  private def apiFor(obj: Any): Option[ProtoApi] = {
+    protoApis.find(_.messageClass.isInstance(obj))
+  }
+
   def apply(orcOutStream: OutStream) = {
     new OrcProtoWriterShim(orcOutStream)
   }
diff --git a/sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/ShimPredicate.scala b/sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/ShimPredicate.scala
new file mode 100644
index 00000000000..3fec849dc36
--- /dev/null
+++ b/sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/ShimPredicate.scala
@@ -0,0 +1,73 @@
+/*
+ * Copyright (c) 2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+/*** spark-rapids-shim-json-lines
+{"spark": "330"}
+{"spark": "330db"}
+{"spark": "331"}
+{"spark": "332"}
+{"spark": "332db"}
+{"spark": "333"}
+{"spark": "334"}
+{"spark": "340"}
+{"spark": "341"}
+{"spark": "341db"}
+{"spark": "342"}
+{"spark": "343"}
+{"spark": "344"}
+{"spark": "350"}
+{"spark": "350db143"}
+{"spark": "351"}
+{"spark": "352"}
+{"spark": "353"}
+{"spark": "354"}
+{"spark": "355"}
+{"spark": "356"}
+{"spark": "357"}
+{"spark": "358"}
+spark-rapids-shim-json-lines ***/
+package com.nvidia.spark.rapids.shims
+
+import org.apache.spark.sql.catalyst.expressions.Predicate
+// Predicate mix-in whose contextIndependentFoldable holds when every child is foldable.
+trait ShimPredicate extends Predicate {
+  def contextIndependentFoldable: Boolean = children.forall(child => child.foldable)
+}
+// DataWritingCommand shim: the row-based run() delegates to the abstract runColumnar().
+trait ShimDataWritingCommand
+    extends org.apache.spark.sql.execution.command.DataWritingCommand
+    with ShimUnaryCommand {
+  def runColumnar(
+      sparkSession: org.apache.spark.sql.SparkSession,
+      child: org.apache.spark.sql.execution.SparkPlan):
+      Seq[org.apache.spark.sql.vectorized.ColumnarBatch]
+  // Same as runColumnar, but takes the session as AnyRef and casts it to SparkSession.
+  def runColumnarFromAny(
+      sparkSession: AnyRef,
+      child: org.apache.spark.sql.execution.SparkPlan):
+      Seq[org.apache.spark.sql.vectorized.ColumnarBatch] = {
+    runColumnar(sparkSession.asInstanceOf[org.apache.spark.sql.SparkSession], child)
+  }
+  // Runs the columnar path, asserts that it produced no batches, and returns no rows.
+  override def run(
+      sparkSession: org.apache.spark.sql.SparkSession,
+      child: org.apache.spark.sql.execution.SparkPlan): Seq[org.apache.spark.sql.Row] = {
+    com.nvidia.spark.rapids.Arm.withResource(runColumnar(sparkSession, child)) { batches =>
+      assert(batches.isEmpty)
+    }
+    Seq.empty[org.apache.spark.sql.Row]
+  }
+}
diff --git a/sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/ShuffleOriginUtil.scala b/sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/ShuffleOriginUtil.scala
index c3176b39a6e..2f9f67c4672 100644
--- a/sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/ShuffleOriginUtil.scala
+++ b/sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/ShuffleOriginUtil.scala
@@ -25,6 +25,19 @@ package com.nvidia.spark.rapids.shims
 
 import org.apache.spark.sql.execution.exchange.{ENSURE_REQUIREMENTS, REBALANCE_PARTITIONS_BY_COL, REBALANCE_PARTITIONS_BY_NONE, REPARTITION_BY_COL, REPARTITION_BY_NUM, ShuffleOrigin}
 
+// Keep executable line numbers aligned with newer shims for binary-dedupe.
+
+
+
+
+
+
+
+
+
+
+
+
 object ShuffleOriginUtil {
   private val knownOrigins: Set[ShuffleOrigin] = Set(ENSURE_REQUIREMENTS,
     REPARTITION_BY_COL, REPARTITION_BY_NUM, REBALANCE_PARTITIONS_BY_NONE,
diff --git a/sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/SparkShims.scala b/sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/SparkShims.scala
index f0f81947d6b..cb155d92d5c 100644
--- a/sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/SparkShims.scala
+++ b/sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shims/SparkShims.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2021-2023, NVIDIA CORPORATION.
+ * Copyright (c) 2021-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -21,14 +21,15 @@ package com.nvidia.spark.rapids.shims
 
 import com.nvidia.spark.rapids._
 
-import org.apache.spark.sql.execution.command.{CreateDataSourceTableAsSelectCommand, DataWritingCommand, RunnableCommand}
+import org.apache.spark.sql.execution.command.{DataWritingCommand, RunnableCommand}
 
 object SparkShimImpl extends Spark330PlusShims with AnsiCastRuleShims {
   override def getDataWriteCmds: Map[Class[_ <: DataWritingCommand],
       DataWritingCommandRule[_ <: DataWritingCommand]] = {
-    Seq(GpuOverrides.dataWriteCmd[CreateDataSourceTableAsSelectCommand](
-    "Create table with select command",
-    (a, conf, p, r) => new CreateDataSourceTableAsSelectCommandMeta(a, conf, p, r))
+    Seq(
+      GpuOverrides.dataWriteCmdFromShim(
+        CreateDataSourceTableAsSelectRules.dataWriteCmd,
+        (a, conf, p, r) => new CreateDataSourceTableAsSelectCommandMeta(a, conf, p, r))
     ).map(r => (r.getClassFor.asSubclass(classOf[DataWritingCommand]), r)).toMap
   }
 
diff --git a/sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shuffle/RapidsShuffleIterator.scala b/sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shuffle/RapidsShuffleIterator.scala
index 1f21cf55c09..1af10fb483d 100644
--- a/sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shuffle/RapidsShuffleIterator.scala
+++ b/sql-plugin/src/main/spark330/scala/com/nvidia/spark/rapids/shuffle/RapidsShuffleIterator.scala
@@ -36,7 +36,6 @@ import com.nvidia.spark.rapids.ScalableTaskCompletion.onTaskCompletion
 import com.nvidia.spark.rapids.jni.RmmSpark
 
 import org.apache.spark.TaskContext
-import org.apache.spark.internal.Logging
 import org.apache.spark.shuffle.rapids.{RapidsShuffleFetchFailedException, RapidsShuffleTimeoutException}
 import org.apache.spark.sql.rapids.{GpuShuffleEnv, ShuffleMetricsUpdater}
 import org.apache.spark.sql.types.DataType
@@ -68,8 +67,33 @@ class RapidsShuffleIterator(
     taskAttemptId: Long,
     catalog: ShuffleReceivedBufferCatalog = GpuShuffleEnv.getReceivedCatalog,
     timeoutSeconds: Long = GpuShuffleEnv.shuffleFetchTimeoutSeconds)
-  extends Iterator[ColumnarBatch]
-    with Logging {
+  extends Iterator[ColumnarBatch] {
+  // slf4j logger named after this instance's runtime class.
+  private[this] val log = org.slf4j.LoggerFactory.getLogger(getClass)
+
+  // Level-guarded logging helpers. Every message is a by-name parameter, so the
+  // string is only built when the matching level is enabled on `log`.
+
+  /** Emits `msg` at INFO level if INFO is enabled. */
+  private def logInfo(msg: => String): Unit = {
+    if (log.isInfoEnabled) log.info(msg)
+  }
+
+  /** Emits `msg` at DEBUG level if DEBUG is enabled. */
+  private def logDebug(msg: => String): Unit = {
+    if (log.isDebugEnabled) log.debug(msg)
+  }
+
+  /** Emits `msg` at WARN level if WARN is enabled. */
+  private def logWarning(msg: => String): Unit = {
+    if (log.isWarnEnabled) log.warn(msg)
+  }
+
+  /** Emits `msg` at ERROR level if ERROR is enabled. */
+  private def logError(msg: => String): Unit = {
+    if (log.isErrorEnabled) log.error(msg)
+  }
+
 
   /**
    * General trait encapsulating either a buffer or an error. Used to hand off batches
@@ -345,7 +369,7 @@ class RapidsShuffleIterator(
     // thread to schedule the fetches for us, it may be something we consider in the future, given
     // memory pressure.
     // No good way to get a metric in here for semaphore time.
-    taskContext.foreach(GpuSemaphore.acquireIfNecessary)
+    taskContext.foreach(GpuSemaphore.acquireIfNecessary(_))
 
     if (!started) {
       // kick off if we haven't already
diff --git a/sql-plugin/src/main/spark330/scala/org/apache/spark/sql/nvidia/DFUDFShims.scala b/sql-plugin/src/main/spark330/scala/org/apache/spark/sql/nvidia/DFUDFShims.scala
deleted file mode 100644
index dc99c9357e3..00000000000
--- a/sql-plugin/src/main/spark330/scala/org/apache/spark/sql/nvidia/DFUDFShims.scala
+++ /dev/null
@@ -1,50 +0,0 @@
-/*
- * Copyright (c) 2024-2026, NVIDIA CORPORATION.
- *
- * Licensed under the Apache License, Version 2.0 (the "License");
- * you may not use this file except in compliance with the License.
- * You may obtain a copy of the License at
- *
- *     http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-
-/*** spark-rapids-shim-json-lines
-{"spark": "330"}
-{"spark": "330db"}
-{"spark": "331"}
-{"spark": "332"}
-{"spark": "332db"}
-{"spark": "333"}
-{"spark": "334"}
-{"spark": "340"}
-{"spark": "341"}
-{"spark": "341db"}
-{"spark": "342"}
-{"spark": "343"}
-{"spark": "344"}
-{"spark": "350"}
-{"spark": "350db143"}
-{"spark": "351"}
-{"spark": "352"}
-{"spark": "353"}
-{"spark": "354"}
-{"spark": "355"}
-{"spark": "356"}
-{"spark": "357"}
-{"spark": "358"}
-spark-rapids-shim-json-lines ***/
-package org.apache.spark.sql.nvidia
-
-import org.apache.spark.sql.Column
-import org.apache.spark.sql.catalyst.expressions.Expression
-
-object DFUDFShims {
-  def columnToExpr(c: Column): Expression = c.expr
-  def exprToColumn(e: Expression): Column = Column(e)
-}
diff --git a/sql-plugin/src/main/spark330/scala/org/apache/spark/sql/rapids/RapidsCachingReader.scala b/sql-plugin/src/main/spark330/scala/org/apache/spark/sql/rapids/RapidsCachingReader.scala
index 224e6f7d7d6..e32030dd40a 100644
--- a/sql-plugin/src/main/spark330/scala/org/apache/spark/sql/rapids/RapidsCachingReader.scala
+++ b/sql-plugin/src/main/spark330/scala/org/apache/spark/sql/rapids/RapidsCachingReader.scala
@@ -32,7 +32,6 @@ import com.nvidia.spark.rapids._
 import com.nvidia.spark.rapids.shuffle.{RapidsShuffleIterator, RapidsShuffleTransport}
 
 import org.apache.spark.{InterruptibleIterator, TaskContext}
-import org.apache.spark.internal.Logging
 import org.apache.spark.shuffle.{ShuffleReader, ShuffleReadMetricsReporter}
 import org.apache.spark.sql.types.DataType
 import org.apache.spark.sql.vectorized.ColumnarBatch
@@ -65,7 +64,21 @@ class RapidsCachingReader[K, C](
     transport: Option[RapidsShuffleTransport],
     catalog: ShuffleBufferCatalog,
     sparkTypes: Array[DataType])
-  extends ShuffleReader[K, C] with Logging {
+  extends ShuffleReader[K, C] {
+  // slf4j logger named after this instance's runtime class. The helpers below take
+  // their message by name, so it is only built when the level is enabled.
+  private[this] val log = org.slf4j.LoggerFactory.getLogger(getClass)
+
+  /** Emits `msg` at INFO level if INFO is enabled. */
+  private def logInfo(msg: => String): Unit = {
+    if (log.isInfoEnabled) log.info(msg)
+  }
+
+  /** Emits `msg` at DEBUG level if DEBUG is enabled. */
+  private def logDebug(msg: => String): Unit = {
+    if (log.isDebugEnabled) log.debug(msg)
+  }
+
 
   override def read(): Iterator[Product2[K, C]] = {
     NvtxRegistry.RAPIDS_CACHING_READER_READ.push()
diff --git a/sql-plugin/src/main/spark330/scala/org/apache/spark/sql/rapids/execution/python/shims/GpuGroupedPythonRunnerFactory.scala b/sql-plugin/src/main/spark330/scala/org/apache/spark/sql/rapids/execution/python/shims/GpuGroupedPythonRunnerFactory.scala
index 5f91ea0d057..e46695013e3 100644
--- a/sql-plugin/src/main/spark330/scala/org/apache/spark/sql/rapids/execution/python/shims/GpuGroupedPythonRunnerFactory.scala
+++ b/sql-plugin/src/main/spark330/scala/org/apache/spark/sql/rapids/execution/python/shims/GpuGroupedPythonRunnerFactory.scala
@@ -45,14 +45,14 @@ import org.apache.spark.sql.rapids.shims.ArrowUtilsShim
 import org.apache.spark.sql.types.StructType
 import org.apache.spark.sql.vectorized.ColumnarBatch
 
-case class GpuGroupedPythonRunnerFactory(
+class GpuGroupedPythonRunnerFactory(
     conf: org.apache.spark.sql.internal.SQLConf,
     chainedFunc: Seq[(ChainedPythonFunctions, Long)],
     argOffsets: Array[Array[Int]],
     dedupAttrs: StructType,
     pythonOutputSchema: StructType,
     evalType: Int,
-    argNames: Option[Array[Array[Option[String]]]] = None) {
+    argNames: Option[Array[Array[Option[String]]]]) extends Serializable {
   val sessionLocalTimeZone = conf.sessionLocalTimeZone
   val pythonRunnerConf = ArrowUtilsShim.getPythonRunnerConfMap(conf)
 
diff --git a/sql-plugin/src/main/spark330/scala/org/apache/spark/sql/rapids/execution/python/shims/PythonArgumentUtils.scala b/sql-plugin/src/main/spark330/scala/org/apache/spark/sql/rapids/execution/python/shims/PythonArgumentUtils.scala
index ce90605c035..3eca24135de 100644
--- a/sql-plugin/src/main/spark330/scala/org/apache/spark/sql/rapids/execution/python/shims/PythonArgumentUtils.scala
+++ b/sql-plugin/src/main/spark330/scala/org/apache/spark/sql/rapids/execution/python/shims/PythonArgumentUtils.scala
@@ -64,6 +64,6 @@ object PythonArgumentUtils {
         }
       }.toArray
     }.toArray
-    GpuPythonArguments(allInputs.toSeq, dataTypes.toSeq, argOffsets, None)
+    new GpuPythonArguments(allInputs.toSeq, dataTypes.toSeq, argOffsets, None)
   }
 }
diff --git a/sql-plugin/src/main/spark330/scala/org/apache/spark/sql/rapids/shims/SparkSessionUtils.scala b/sql-plugin/src/main/spark330/scala/org/apache/spark/sql/rapids/shims/SparkSessionUtils.scala
deleted file mode 100644
index c7ec03facf4..00000000000
--- a/sql-plugin/src/main/spark330/scala/org/apache/spark/sql/rapids/shims/SparkSessionUtils.scala
+++ /dev/null
@@ -1,56 +0,0 @@
-/*
- * Copyright (c) 2025-2026, NVIDIA CORPORATION.
- *
- * Licensed under the Apache License, Version 2.0 (the "License");
- * you may not use this file except in compliance with the License.
- * You may obtain a copy of the License at
- *
- *     http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-
-/*** spark-rapids-shim-json-lines
-{"spark": "330"}
-{"spark": "330db"}
-{"spark": "331"}
-{"spark": "332"}
-{"spark": "332db"}
-{"spark": "333"}
-{"spark": "334"}
-{"spark": "340"}
-{"spark": "341"}
-{"spark": "341db"}
-{"spark": "342"}
-{"spark": "343"}
-{"spark": "344"}
-{"spark": "350"}
-{"spark": "350db143"}
-{"spark": "351"}
-{"spark": "352"}
-{"spark": "353"}
-{"spark": "354"}
-{"spark": "355"}
-{"spark": "356"}
-{"spark": "357"}
-{"spark": "358"}
-spark-rapids-shim-json-lines ***/
-package org.apache.spark.sql.rapids.shims
-
-import org.apache.spark.sql.SparkSession
-import org.apache.spark.sql.execution.SparkPlan
-
-object SparkSessionUtils {
-
-  def sessionFromPlan(plan: SparkPlan): SparkSession = {
-    plan.session
-  }
-
-  def leafNodeDefaultParallelism(ss: SparkSession): Int = {
-    ss.leafNodeDefaultParallelism
-  }
-}
diff --git a/sql-plugin/src/main/spark330db/scala/com/nvidia/spark/rapids/shims/CheckOverflowInTableInsertShims.scala b/sql-plugin/src/main/spark330db/scala/com/nvidia/spark/rapids/shims/CheckOverflowInTableInsertShims.scala
new file mode 100644
index 00000000000..137e72913ae
--- /dev/null
+++ b/sql-plugin/src/main/spark330db/scala/com/nvidia/spark/rapids/shims/CheckOverflowInTableInsertShims.scala
@@ -0,0 +1,82 @@
+/*
+ * Copyright (c) 2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+/*** spark-rapids-shim-json-lines
+{"spark": "330db"}
+{"spark": "331"}
+{"spark": "332"}
+{"spark": "332db"}
+{"spark": "333"}
+{"spark": "334"}
+{"spark": "340"}
+{"spark": "341"}
+{"spark": "341db"}
+{"spark": "342"}
+{"spark": "343"}
+{"spark": "344"}
+{"spark": "350"}
+{"spark": "350db143"}
+{"spark": "351"}
+{"spark": "352"}
+{"spark": "353"}
+{"spark": "354"}
+{"spark": "355"}
+{"spark": "356"}
+{"spark": "357"}
+{"spark": "358"}
+{"spark": "400"}
+{"spark": "400db173"}
+{"spark": "401"}
+{"spark": "402"}
+{"spark": "411"}
+spark-rapids-shim-json-lines ***/
+package com.nvidia.spark.rapids.shims
+
+import com.nvidia.spark.rapids.{
+  ExprChecks,
+  ExprRule,
+  GpuCast,
+  GpuExpression,
+  GpuOverrides,
+  TypeSig,
+  UnaryExprMeta
+}
+
+import org.apache.spark.sql.catalyst.expressions.{CheckOverflowInTableInsert, Expression}
+import org.apache.spark.sql.rapids.GpuCheckOverflowInTableInsert
+
+object CheckOverflowInTableInsertShims {
+  // GPU replacement rule for CheckOverflowInTableInsert. Every input type is accepted
+  // because the child Cast does the type checking and the calculations; the converted
+  // child therefore has to be a GpuCast.
+  private def overflowRule =
+    GpuOverrides.expr[CheckOverflowInTableInsert](
+      "Casting a numeric value as another numeric type in store assignment",
+      ExprChecks.unaryProjectInputMatchesOutput(TypeSig.all, TypeSig.all),
+      (t, conf, p, r) => new UnaryExprMeta[CheckOverflowInTableInsert](t, conf, p, r) {
+        override def convertToGpu(child: Expression): GpuExpression = child match {
+          case c: GpuCast => GpuCheckOverflowInTableInsert(c, t.columnName)
+          case _ =>
+            throw new IllegalStateException("Expression child is not of Type GpuCast")
+        }
+      })
+
+  // Rules keyed by the Spark expression class they replace.
+  val exprs: Map[Class[_ <: Expression], ExprRule[_ <: Expression]] = {
+    val rules = Seq(overflowRule)
+    rules.map(rule => (rule.getClassFor.asSubclass(classOf[Expression]), rule)).toMap
+  }
+}
diff --git a/sql-plugin/src/main/spark330db/scala/com/nvidia/spark/rapids/shims/Spark321PlusDBShims.scala b/sql-plugin/src/main/spark330db/scala/com/nvidia/spark/rapids/shims/Spark321PlusDBShims.scala
index f86b131dcbd..d11b1c7f7f2 100644
--- a/sql-plugin/src/main/spark330db/scala/com/nvidia/spark/rapids/shims/Spark321PlusDBShims.scala
+++ b/sql-plugin/src/main/spark330db/scala/com/nvidia/spark/rapids/shims/Spark321PlusDBShims.scala
@@ -123,8 +123,8 @@ trait Spark321PlusDBShims extends SparkShims
               TypeSig.STRUCT + TypeSig.ARRAY + TypeSig.MAP).nested(),
           TypeSig.all,
           Map("partitionSpec" ->
-              InputCheck(TypeSig.commonCudfTypes + TypeSig.NULL + TypeSig.DECIMAL_128,
-                TypeSig.all))),
+              new InputCheck(TypeSig.commonCudfTypes + TypeSig.NULL + TypeSig.DECIMAL_128,
+                TypeSig.all, List.empty))),
         (runningWindowFunctionExec, conf, p, r) =>
           new GpuRunningWindowExecMeta(runningWindowFunctionExec, conf, p, r)
       )
@@ -139,9 +139,9 @@ trait Spark321PlusDBShims extends SparkShims
       GpuOverrides.expr[EphemeralSubstring](
         "Ephemeral version of substring operator",
         ExprChecks.projectOnly(TypeSig.STRING, TypeSig.STRING + TypeSig.BINARY,
-          Seq(ParamCheck("str", TypeSig.STRING, TypeSig.STRING + TypeSig.BINARY),
-            ParamCheck("pos", TypeSig.INT, TypeSig.INT),
-            ParamCheck("len", TypeSig.INT, TypeSig.INT))),
+          Seq(new ParamCheck("str", TypeSig.STRING, TypeSig.STRING + TypeSig.BINARY),
+            new ParamCheck("pos", TypeSig.INT, TypeSig.INT),
+            new ParamCheck("len", TypeSig.INT, TypeSig.INT))),
         (in, conf, p, r) => new TernaryExprMeta[EphemeralSubstring](in, conf, p, r) {
           override def convertToGpu(
               column: Expression,
diff --git a/sql-plugin/src/main/spark330db/scala/com/nvidia/spark/rapids/shims/Spark330PlusDBShims.scala b/sql-plugin/src/main/spark330db/scala/com/nvidia/spark/rapids/shims/Spark330PlusDBShims.scala
index fac3314c709..349368def4f 100644
--- a/sql-plugin/src/main/spark330db/scala/com/nvidia/spark/rapids/shims/Spark330PlusDBShims.scala
+++ b/sql-plugin/src/main/spark330db/scala/com/nvidia/spark/rapids/shims/Spark330PlusDBShims.scala
@@ -30,29 +30,16 @@ import org.apache.spark.sql.catalyst.plans.physical.SinglePartition
 import org.apache.spark.sql.execution.{ColumnarToRowTransition, SparkPlan}
 import org.apache.spark.sql.execution.adaptive.ShuffleQueryStageExec
 import org.apache.spark.sql.execution.exchange.{EXECUTOR_BROADCAST, ShuffleExchangeExec, ShuffleExchangeLike}
-import org.apache.spark.sql.rapids.{GpuCheckOverflowInTableInsert, GpuElementAtMeta}
+import org.apache.spark.sql.rapids.GpuElementAtMeta
 import org.apache.spark.sql.rapids.execution.{GpuBroadcastHashJoinExec, GpuBroadcastNestedLoopJoinExec}
 
 trait Spark330PlusDBShims extends Spark321PlusDBShims {
   override def getExprs: Map[Class[_ <: Expression], ExprRule[_ <: Expression]] = {
     val shimExprs: Map[Class[_ <: Expression], ExprRule[_ <: Expression]] = Seq(
-      GpuOverrides.expr[CheckOverflowInTableInsert](
-        "Casting a numeric value as another numeric type in store assignment",
-        ExprChecks.unaryProjectInputMatchesOutput(
-          TypeSig.all,
-          TypeSig.all),
-        (t, conf, p, r) => new UnaryExprMeta[CheckOverflowInTableInsert](t, conf, p, r) {
-          override def convertToGpu(child: Expression): GpuExpression = {
-            child match {
-              case c: GpuCast => GpuCheckOverflowInTableInsert(c, t.columnName)
-              case _ =>
-                throw new IllegalStateException("Expression child is not of Type GpuCast")
-            }
-          }
-        }),
       GpuElementAtMeta.elementAtRule(true)
     ).map(r => (r.getClassFor.asSubclass(classOf[Expression]), r)).toMap
-    super.getExprs ++ shimExprs ++ DayTimeIntervalShims.exprs ++ RoundingShims.exprs
+    super.getExprs ++ CheckOverflowInTableInsertShims.exprs ++ shimExprs ++
+        DayTimeIntervalShims.exprs ++ RoundingShims.exprs
   }
 
   override def getExecs: Map[Class[_ <: SparkPlan], ExecRule[_ <: SparkPlan]] =
diff --git a/sql-plugin/src/main/spark330db/scala/com/nvidia/spark/rapids/shims/SparkShims.scala b/sql-plugin/src/main/spark330db/scala/com/nvidia/spark/rapids/shims/SparkShims.scala
index 84f5c4e4886..324c7718ab5 100644
--- a/sql-plugin/src/main/spark330db/scala/com/nvidia/spark/rapids/shims/SparkShims.scala
+++ b/sql-plugin/src/main/spark330db/scala/com/nvidia/spark/rapids/shims/SparkShims.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2022-2023, NVIDIA CORPORATION.
+ * Copyright (c) 2022-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -22,7 +22,7 @@ package com.nvidia.spark.rapids.shims
 import com.nvidia.spark.rapids._
 
 import org.apache.spark.sql.catalyst.expressions.Expression
-import org.apache.spark.sql.execution.command.{CreateDataSourceTableAsSelectCommand, DataWritingCommand, RunnableCommand}
+import org.apache.spark.sql.execution.command.{DataWritingCommand, RunnableCommand}
 
 object SparkShimImpl extends Spark330PlusDBShims {
   // AnsiCast is removed from Spark3.4.0
@@ -30,9 +30,10 @@ object SparkShimImpl extends Spark330PlusDBShims {
 
   override def getDataWriteCmds: Map[Class[_ <: DataWritingCommand],
       DataWritingCommandRule[_ <: DataWritingCommand]] = {
-    Seq(GpuOverrides.dataWriteCmd[CreateDataSourceTableAsSelectCommand](
-    "Create table with select command",
-    (a, conf, p, r) => new CreateDataSourceTableAsSelectCommandMeta(a, conf, p, r))
+    Seq(
+      GpuOverrides.dataWriteCmdFromShim(
+        CreateDataSourceTableAsSelectRules.dataWriteCmd,
+        (a, conf, p, r) => new CreateDataSourceTableAsSelectCommandMeta(a, conf, p, r))
     ).map(r => (r.getClassFor.asSubclass(classOf[DataWritingCommand]), r)).toMap
   }
 
diff --git a/sql-plugin/src/main/spark330db/scala/org/apache/spark/sql/rapids/arithmetic.scala b/sql-plugin/src/main/spark330db/scala/org/apache/spark/sql/rapids/arithmetic.scala
index 160f93fc34a..a9d2530a443 100644
--- a/sql-plugin/src/main/spark330db/scala/org/apache/spark/sql/rapids/arithmetic.scala
+++ b/sql-plugin/src/main/spark330db/scala/org/apache/spark/sql/rapids/arithmetic.scala
@@ -49,7 +49,6 @@ import com.nvidia.spark.rapids.Arm.{closeOnExcept, withResource}
 import com.nvidia.spark.rapids.RapidsPluginImplicits._
 import com.nvidia.spark.rapids.shims.NullIntolerantShim
 
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.catalyst.analysis.TypeCheckResult
 import org.apache.spark.sql.catalyst.expressions.Expression
 import org.apache.spark.sql.catalyst.trees.{CurrentOrigin, Origin}
@@ -279,7 +278,7 @@ case class GpuDecimalRemainder(
     left: Expression,
     right: Expression,
     failOnError: Boolean = SQLConf.get.ansiEnabled)
-  extends GpuRemainderBase(left, right) with Logging {
+  extends GpuRemainderBase(left, right) {
 
   // scalastyle:off
   // The formula follows Hive which is based on the SQL standard and MS SQL:
diff --git a/sql-plugin/src/main/spark330db/scala/org/apache/spark/sql/rapids/execution/python/shims/GpuGroupedPythonRunnerFactory.scala b/sql-plugin/src/main/spark330db/scala/org/apache/spark/sql/rapids/execution/python/shims/GpuGroupedPythonRunnerFactory.scala
index 70837659871..02aba89c418 100644
--- a/sql-plugin/src/main/spark330db/scala/org/apache/spark/sql/rapids/execution/python/shims/GpuGroupedPythonRunnerFactory.scala
+++ b/sql-plugin/src/main/spark330db/scala/org/apache/spark/sql/rapids/execution/python/shims/GpuGroupedPythonRunnerFactory.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2023-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2023-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -25,14 +25,14 @@ import org.apache.spark.sql.rapids.shims.ArrowUtilsShim
 import org.apache.spark.sql.types.StructType
 import org.apache.spark.sql.vectorized.ColumnarBatch
 
-case class GpuGroupedPythonRunnerFactory(
+class GpuGroupedPythonRunnerFactory(
   conf: org.apache.spark.sql.internal.SQLConf,
   chainedFunc: Seq[(ChainedPythonFunctions, Long)],
   argOffsets: Array[Array[Int]],
   dedupAttrs: StructType,
   pythonOutputSchema: StructType,
   evalType: Int,
-  argNames: Option[Array[Array[Option[String]]]] = None) {
+  argNames: Option[Array[Array[Option[String]]]]) extends Serializable {
   // Configs from DB runtime
   val maxBytes = conf.pandasZeroConfConversionGroupbyApplyMaxBytesPerSlice
   val zeroConfEnabled = conf.pandasZeroConfConversionGroupbyApplyEnabled
diff --git a/sql-plugin/src/main/spark331/scala/com/nvidia/spark/rapids/shims/Spark331PlusNonDBShims.scala b/sql-plugin/src/main/spark331/scala/com/nvidia/spark/rapids/shims/Spark331PlusNonDBShims.scala
index a65872ff22e..c36d13c15ed 100644
--- a/sql-plugin/src/main/spark331/scala/com/nvidia/spark/rapids/shims/Spark331PlusNonDBShims.scala
+++ b/sql-plugin/src/main/spark331/scala/com/nvidia/spark/rapids/shims/Spark331PlusNonDBShims.scala
@@ -40,31 +40,12 @@
 spark-rapids-shim-json-lines ***/
 package com.nvidia.spark.rapids.shims
 
-import com.nvidia.spark.rapids.{ExprChecks, ExprRule, GpuCast, GpuExpression, GpuOverrides, TypeSig, UnaryExprMeta}
+import com.nvidia.spark.rapids.ExprRule
 
-import org.apache.spark.sql.catalyst.expressions.{CheckOverflowInTableInsert, Expression}
-import org.apache.spark.sql.rapids.GpuCheckOverflowInTableInsert
+import org.apache.spark.sql.catalyst.expressions.Expression
 
 trait Spark331PlusNonDBShims extends Spark330PlusNonDBShims {
   override def getExprs: Map[Class[_ <: Expression], ExprRule[_ <: Expression]] = {
-    val map: Map[Class[_ <: Expression], ExprRule[_ <: Expression]] = Seq(
-      // Add expression CheckOverflowInTableInsert starting Spark-3.3.1+
-      // Accepts all types as input as the child Cast does the type checking and the calculations.
-      GpuOverrides.expr[CheckOverflowInTableInsert](
-        "Casting a numeric value as another numeric type in store assignment",
-        ExprChecks.unaryProjectInputMatchesOutput(
-          TypeSig.all,
-          TypeSig.all),
-        (t, conf, p, r) => new UnaryExprMeta[CheckOverflowInTableInsert](t, conf, p, r) {
-          override def convertToGpu(child: Expression): GpuExpression = {
-            child match {
-              case c: GpuCast => GpuCheckOverflowInTableInsert(c, t.columnName)
-              case _ =>
-                throw new IllegalStateException("Expression child is not of Type GpuCast")
-            }
-          }
-        })
-    ).map(r => (r.getClassFor.asSubclass(classOf[Expression]), r)).toMap
-    super.getExprs ++ map
+    super.getExprs ++ CheckOverflowInTableInsertShims.exprs
   }
 }
diff --git a/sql-plugin/src/main/spark331/scala/com/nvidia/spark/rapids/shims/SparkShims.scala b/sql-plugin/src/main/spark331/scala/com/nvidia/spark/rapids/shims/SparkShims.scala
index 12d59e845d6..f90cc53fdeb 100644
--- a/sql-plugin/src/main/spark331/scala/com/nvidia/spark/rapids/shims/SparkShims.scala
+++ b/sql-plugin/src/main/spark331/scala/com/nvidia/spark/rapids/shims/SparkShims.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2022-2023, NVIDIA CORPORATION.
+ * Copyright (c) 2022-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -24,14 +24,15 @@ package com.nvidia.spark.rapids.shims
 
 import com.nvidia.spark.rapids._
 
-import org.apache.spark.sql.execution.command.{CreateDataSourceTableAsSelectCommand, DataWritingCommand, RunnableCommand}
+import org.apache.spark.sql.execution.command.{DataWritingCommand, RunnableCommand}
 
 object SparkShimImpl extends Spark331PlusNonDBShims with AnsiCastRuleShims {
   override def getDataWriteCmds: Map[Class[_ <: DataWritingCommand],
       DataWritingCommandRule[_ <: DataWritingCommand]] = {
-    Seq(GpuOverrides.dataWriteCmd[CreateDataSourceTableAsSelectCommand](
-    "Create table with select command",
-    (a, conf, p, r) => new CreateDataSourceTableAsSelectCommandMeta(a, conf, p, r))
+    Seq(
+      GpuOverrides.dataWriteCmdFromShim(
+        CreateDataSourceTableAsSelectRules.dataWriteCmd,
+        (a, conf, p, r) => new CreateDataSourceTableAsSelectCommandMeta(a, conf, p, r))
     ).map(r => (r.getClassFor.asSubclass(classOf[DataWritingCommand]), r)).toMap
   }
 
diff --git a/sql-plugin/src/main/spark332db/scala/com/nvidia/spark/rapids/shims/Spark332PlusDBShims.scala b/sql-plugin/src/main/spark332db/scala/com/nvidia/spark/rapids/shims/Spark332PlusDBShims.scala
index ad235624b6b..83b40cfa7f3 100644
--- a/sql-plugin/src/main/spark332db/scala/com/nvidia/spark/rapids/shims/Spark332PlusDBShims.scala
+++ b/sql-plugin/src/main/spark332db/scala/com/nvidia/spark/rapids/shims/Spark332PlusDBShims.scala
@@ -26,8 +26,7 @@ import com.nvidia.spark.rapids._
 
 import org.apache.spark.sql.catalyst.expressions._
 import org.apache.spark.sql.execution.SparkPlan
-import org.apache.spark.sql.execution.command.{CreateDataSourceTableAsSelectCommand, DataWritingCommand, RunnableCommand}
-import org.apache.spark.sql.execution.datasources._
+import org.apache.spark.sql.execution.command.{DataWritingCommand, RunnableCommand}
 
 trait Spark332PlusDBShims extends Spark330PlusDBShims {
   // AnsiCast is removed from Spark3.4.0
@@ -47,19 +46,8 @@ trait Spark332PlusDBShims extends Spark330PlusDBShims {
     super.getExprs ++ shimExprs
   }
 
-  private val shimExecs: Map[Class[_ <: SparkPlan], ExecRule[_ <: SparkPlan]] = Seq(
-    GpuOverrides.exec[WriteFilesExec](
-      "v1 write files",
-      // WriteFilesExec always has patterns:
-      //   InsertIntoHadoopFsRelationCommand(WriteFilesExec) or InsertIntoHiveTable(WriteFilesExec)
-      // The parent node of `WriteFilesExec` will check the types, here just let type check pass
-      ExecChecks(TypeSig.all, TypeSig.all),
-      (write, conf, p, r) => new GpuWriteFilesMeta(write, conf, p, r)
-    )
-  ).map(r => (r.getClassFor.asSubclass(classOf[SparkPlan]), r)).toMap
-
   override def getExecs: Map[Class[_ <: SparkPlan], ExecRule[_ <: SparkPlan]] =
-    super.getExecs ++ shimExecs
+    super.getExecs ++ WriteFilesExecRule.execs
 
   override def getDataWriteCmds: Map[Class[_ <: DataWritingCommand],
     DataWritingCommandRule[_ <: DataWritingCommand]] = {
@@ -71,8 +59,8 @@ trait Spark332PlusDBShims extends Spark330PlusDBShims {
   override def getRunnableCmds: Map[Class[_ <: RunnableCommand],
     RunnableCommandRule[_ <: RunnableCommand]] = {
     Seq(
-      GpuOverrides.runnableCmd[CreateDataSourceTableAsSelectCommand](
-        "Write to a data source",
+      GpuOverrides.runnableCmdFromShim(
+        CreateDataSourceTableAsSelectRules.runnableCmd,
         (a, conf, p, r) => new CreateDataSourceTableAsSelectCommandMeta(a, conf, p, r))
     ).map(r => (r.getClassFor.asSubclass(classOf[RunnableCommand]), r)).toMap
   }
diff --git a/sql-plugin/src/main/spark330db/scala/com/nvidia/spark/rapids/shims/TryModeShim.scala b/sql-plugin/src/main/spark332db/scala/com/nvidia/spark/rapids/shims/WriteFilesExecRule.scala
similarity index 53%
rename from sql-plugin/src/main/spark330db/scala/com/nvidia/spark/rapids/shims/TryModeShim.scala
rename to sql-plugin/src/main/spark332db/scala/com/nvidia/spark/rapids/shims/WriteFilesExecRule.scala
index c367c1c4f68..cc331765954 100644
--- a/sql-plugin/src/main/spark330db/scala/com/nvidia/spark/rapids/shims/TryModeShim.scala
+++ b/sql-plugin/src/main/spark332db/scala/com/nvidia/spark/rapids/shims/WriteFilesExecRule.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2025-2026, NVIDIA CORPORATION.
+ * Copyright (c) 2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -15,7 +15,6 @@
  */
 
 /*** spark-rapids-shim-json-lines
-{"spark": "330db"}
 {"spark": "332db"}
 {"spark": "340"}
 {"spark": "341"}
@@ -34,29 +33,30 @@
 {"spark": "357"}
 {"spark": "358"}
 {"spark": "400"}
+{"spark": "400db173"}
 {"spark": "401"}
 {"spark": "402"}
+{"spark": "411"}
 spark-rapids-shim-json-lines ***/
 package com.nvidia.spark.rapids.shims
 
-import org.apache.spark.sql.catalyst.expressions.{Add, Divide, EvalMode, Expression, Multiply, Remainder, Subtract}
-import org.apache.spark.sql.catalyst.expressions.aggregate.{Average, Sum}
+import com.nvidia.spark.rapids.{ExecChecks, ExecRule, GpuOverrides, TypeSig}
 
-object TryModeShim {
-  /**
-   * Check if an expression is in TRY mode.
-   */
-  def isTryMode(expr: Expression): Boolean = {
-    val evalMode = expr match {
-      case add: Add => add.evalMode
-      case sub: Subtract => sub.evalMode
-      case mul: Multiply => mul.evalMode
-      case div: Divide => div.evalMode
-      case mod: Remainder => mod.evalMode
-      case avg: Average => avg.evalMode
-      case sum: Sum => sum.evalMode
-      case _ => throw new RuntimeException(s"Unsupported expression $expr in TRY mode")
-    }
-    evalMode == EvalMode.TRY
+import org.apache.spark.sql.execution.SparkPlan
+import org.apache.spark.sql.execution.datasources.GpuWriteFilesMeta
+
+object WriteFilesExecRule {
+  val execs: Map[Class[_ <: SparkPlan], ExecRule[_ <: SparkPlan]] = {
+    Seq(
+      GpuOverrides.execFromShim(
+        WriteFilesExecShims.exec,
+        // WriteFilesExec always has patterns:
+        //   InsertIntoHadoopFsRelationCommand(WriteFilesExec) or
+        //   InsertIntoHiveTable(WriteFilesExec)
+        // The parent node of `WriteFilesExec` will check the types, here just let type check pass.
+        ExecChecks(TypeSig.all, TypeSig.all),
+        (write, conf, p, r) => new GpuWriteFilesMeta(write, conf, p, r)
+      )
+    ).map(r => (r.getClassFor.asSubclass(classOf[SparkPlan]), r)).toMap
   }
 }
diff --git a/sql-plugin/src/main/spark332db/scala/org/apache/spark/sql/hive/rapids/shims/HiveFileUtil.scala b/sql-plugin/src/main/spark332db/scala/org/apache/spark/sql/hive/rapids/shims/HiveFileUtil.scala
index 307f0e14665..37e1c8b86c2 100644
--- a/sql-plugin/src/main/spark332db/scala/org/apache/spark/sql/hive/rapids/shims/HiveFileUtil.scala
+++ b/sql-plugin/src/main/spark332db/scala/org/apache/spark/sql/hive/rapids/shims/HiveFileUtil.scala
@@ -45,9 +45,15 @@ import scala.util.control.NonFatal
 import org.apache.hadoop.conf.Configuration
 import org.apache.hadoop.fs.Path
 
-import org.apache.spark.internal.Logging
+object HiveFileUtil {
+  private val log = org.slf4j.LoggerFactory.getLogger(getClass.getName.stripSuffix("$"))
+
+  private def logWarning(msg: => String): Unit = {
+    if (log.isWarnEnabled) {
+      log.warn(msg)
+    }
+  }
 
-object HiveFileUtil extends Logging {
 
   // prior to Spark 3.4.0, this method was accessible via the SaveAsHiveFile trait, but
   // was removed in https://github.com/apache/spark/pull/39277
diff --git a/sql-plugin/src/main/spark332db/scala/org/apache/spark/sql/rapids/GpuFileFormatWriter.scala b/sql-plugin/src/main/spark332db/scala/org/apache/spark/sql/rapids/GpuFileFormatWriter.scala
index 51d0067bf1c..13dcd2c69fb 100644
--- a/sql-plugin/src/main/spark332db/scala/org/apache/spark/sql/rapids/GpuFileFormatWriter.scala
+++ b/sql-plugin/src/main/spark332db/scala/org/apache/spark/sql/rapids/GpuFileFormatWriter.scala
@@ -533,7 +533,7 @@ trait GpuFileFormatWriterBase extends Serializable with Logging {
   private def verifySchema(format: ColumnarFileFormat, schema: StructType): Unit = {
     schema.foreach { field =>
       if (!format.supportDataType(field.dataType)) {
-        throw new RapidsAnalysisException(
+        throw RapidsAnalysisException(
           s"$format data source does not support ${field.dataType.catalogString} data type.")
       }
     }
diff --git a/sql-plugin/src/main/spark340/scala/com/nvidia/spark/rapids/shims/OrcProtoWriterShim.scala b/sql-plugin/src/main/spark340/scala/com/nvidia/spark/rapids/shims/OrcProtoWriterShim.scala
index 047f25fd910..0e812573805 100644
--- a/sql-plugin/src/main/spark340/scala/com/nvidia/spark/rapids/shims/OrcProtoWriterShim.scala
+++ b/sql-plugin/src/main/spark340/scala/com/nvidia/spark/rapids/shims/OrcProtoWriterShim.scala
@@ -40,23 +40,80 @@
 spark-rapids-shim-json-lines ***/
 package com.nvidia.spark.rapids.shims
 
+import java.io.OutputStream
+import java.lang.reflect.{InvocationTargetException, Method}
+
 import org.apache.orc.impl.OutStream
-import org.apache.orc.protobuf.{AbstractMessage, CodedOutputStream}
 
 class OrcProtoWriterShim(orcOutStream: OutStream) {
-  val proxied = CodedOutputStream.newInstance(orcOutStream)
-  def writeAndFlush(obj: Any): Unit = obj match {
-    case m: AbstractMessage =>
-      m.writeTo(proxied)
-      proxied.flush()
-      orcOutStream.flush()
-    case _ =>
-      require(obj.isInstanceOf[AbstractMessage],
-        s"Unexpected protobuf message type: $obj")
+  import OrcProtoWriterShim.ProtoApi
+
+  private[this] var proxiedApi: ProtoApi = _
+  private[this] var proxied: AnyRef = _
+
+  // Lazily creates the CodedOutputStream for the given protobuf flavor and reuses it
+  // until a message of a different flavor is written.
+  private def proxiedFor(api: ProtoApi): AnyRef = {
+    if (proxiedApi != api) {
+      proxiedApi = api
+      proxied = api.newInstance.invoke(null, orcOutStream.asInstanceOf[OutputStream])
+    }
+    proxied
+  }
+
+  /**
+   * Serializes `obj` through the matching protobuf API and flushes both streams.
+   * Throws IllegalArgumentException when `obj` is not a known protobuf message.
+   */
+  def writeAndFlush(obj: Any): Unit = {
+    val api = OrcProtoWriterShim.apiFor(obj).getOrElse {
+      throw new IllegalArgumentException(
+        s"requirement failed: Unexpected protobuf message type: $obj")
+    }
+    val currentProxied = proxiedFor(api)
+    try {
+      api.writeTo.invoke(obj.asInstanceOf[AnyRef], currentProxied)
+      api.flush.invoke(currentProxied)
+    } catch {
+      // Method.invoke wraps failures; rethrow the cause (e.g. IOException) so callers
+      // see the same exception types as with the previous direct calls.
+      case e: InvocationTargetException if e.getCause != null => throw e.getCause
+    }
+    orcOutStream.flush()
   }
 }
 
 object OrcProtoWriterShim {
+  private case class ProtoApi(
+      messageClass: Class[_],
+      newInstance: Method,
+      writeTo: Method,
+      flush: Method)
+
+  private val protoClassNames = Seq(
+    ("org.apache.orc.protobuf.AbstractMessage",
+      "org.apache.orc.protobuf.CodedOutputStream"),
+    ("com.google.protobuf.AbstractMessage",
+      "com.google.protobuf.CodedOutputStream"))
+
+  private lazy val protoApis: Seq[ProtoApi] = protoClassNames.flatMap { case (msg, out) =>
+    try {
+      val messageClass = Class.forName(msg)
+      val codedOutputStreamClass = Class.forName(out)
+      Some(ProtoApi(
+        messageClass,
+        codedOutputStreamClass.getMethod("newInstance", classOf[OutputStream]),
+        messageClass.getMethod("writeTo", codedOutputStreamClass),
+        codedOutputStreamClass.getMethod("flush")))
+    } catch {
+      case _: ReflectiveOperationException | _: LinkageError => None // flavor not loadable
+    }
+  }
+
+  private def apiFor(obj: Any): Option[ProtoApi] = {
+    protoApis.find(_.messageClass.isInstance(obj))
+  }
+
   def apply(orcOutStream: OutStream) = {
     new OrcProtoWriterShim(orcOutStream)
   }
diff --git a/sql-plugin/src/main/spark340/scala/com/nvidia/spark/rapids/shims/Spark340PlusNonDBShims.scala b/sql-plugin/src/main/spark340/scala/com/nvidia/spark/rapids/shims/Spark340PlusNonDBShims.scala
index 88c62eea41b..2276a9685db 100644
--- a/sql-plugin/src/main/spark340/scala/com/nvidia/spark/rapids/shims/Spark340PlusNonDBShims.scala
+++ b/sql-plugin/src/main/spark340/scala/com/nvidia/spark/rapids/shims/Spark340PlusNonDBShims.scala
@@ -43,8 +43,7 @@ import org.apache.spark.rapids.shims.GpuShuffleExchangeExec
 import org.apache.spark.sql.catalyst.expressions.{Empty2Null, Expression, KnownNullable, NamedExpression, SortOrder}
 import org.apache.spark.sql.catalyst.plans.physical.SinglePartition
 import org.apache.spark.sql.execution.{CollectLimitExec, GlobalLimitExec, SparkPlan, TakeOrderedAndProjectExec}
-import org.apache.spark.sql.execution.command.{CreateDataSourceTableAsSelectCommand, DataWritingCommand, RunnableCommand}
-import org.apache.spark.sql.execution.datasources.{GpuWriteFilesMeta, WriteFilesExec}
+import org.apache.spark.sql.execution.command.{DataWritingCommand, RunnableCommand}
 import org.apache.spark.sql.execution.exchange.ENSURE_REQUIREMENTS
 import org.apache.spark.sql.rapids.GpuElementAtMeta
 import org.apache.spark.sql.rapids.GpuV1WriteUtils.GpuEmpty2Null
@@ -121,19 +120,11 @@ trait Spark340PlusNonDBShims extends Spark331PlusNonDBShims {
       }
     ).disabledByDefault("Collect Limit replacement can be slower on the GPU, if huge number " +
         "of rows in a batch it could help by limiting the number of rows transferred from " +
-        "GPU to CPU"),
-    GpuOverrides.exec[WriteFilesExec](
-      "v1 write files",
-      // WriteFilesExec always has patterns:
-      //   InsertIntoHadoopFsRelationCommand(WriteFilesExec) or InsertIntoHiveTable(WriteFilesExec)
-      // The parent node of `WriteFilesExec` will check the types, here just let type check pass
-      ExecChecks(TypeSig.all, TypeSig.all),
-      (write, conf, p, r) => new GpuWriteFilesMeta(write, conf, p, r)
-    )
+        "GPU to CPU")
   ).map(r => (r.getClassFor.asSubclass(classOf[SparkPlan]), r)).toMap
 
   override def getExecs: Map[Class[_ <: SparkPlan], ExecRule[_ <: SparkPlan]] =
-    super.getExecs ++ shimExecs
+    super.getExecs ++ shimExecs ++ WriteFilesExecRule.execs
 
   // AnsiCast is removed from Spark3.4.0
   override def ansiCastRule: ExprRule[_ <: Expression] = null
@@ -173,8 +164,8 @@ trait Spark340PlusNonDBShims extends Spark331PlusNonDBShims {
   override def getRunnableCmds: Map[Class[_ <: RunnableCommand],
       RunnableCommandRule[_ <: RunnableCommand]] = {
     Seq(
-      GpuOverrides.runnableCmd[CreateDataSourceTableAsSelectCommand](
-        "Write to a data source",
+      GpuOverrides.runnableCmdFromShim(
+        CreateDataSourceTableAsSelectRules.runnableCmd,
         (a, conf, p, r) => new CreateDataSourceTableAsSelectCommandMeta(a, conf, p, r))
     ).map(r => (r.getClassFor.asSubclass(classOf[RunnableCommand]), r)).toMap
   }
diff --git a/sql-plugin/src/main/spark340/scala/com/nvidia/spark/rapids/shuffle/RapidsShuffleIterator.scala b/sql-plugin/src/main/spark340/scala/com/nvidia/spark/rapids/shuffle/RapidsShuffleIterator.scala
index 4bf7215e2a0..b9966a7840a 100644
--- a/sql-plugin/src/main/spark340/scala/com/nvidia/spark/rapids/shuffle/RapidsShuffleIterator.scala
+++ b/sql-plugin/src/main/spark340/scala/com/nvidia/spark/rapids/shuffle/RapidsShuffleIterator.scala
@@ -49,7 +49,6 @@ import com.nvidia.spark.rapids.ScalableTaskCompletion.onTaskCompletion
 import com.nvidia.spark.rapids.jni.RmmSpark
 
 import org.apache.spark.TaskContext
-import org.apache.spark.internal.Logging
 import org.apache.spark.shuffle.rapids.{RapidsShuffleFetchFailedException, RapidsShuffleTimeoutException}
 import org.apache.spark.sql.rapids.{GpuShuffleEnv, ShuffleMetricsUpdater}
 import org.apache.spark.sql.types.DataType
@@ -81,8 +80,33 @@ class RapidsShuffleIterator(
     taskAttemptId: Long,
     catalog: ShuffleReceivedBufferCatalog = GpuShuffleEnv.getReceivedCatalog,
     timeoutSeconds: Long = GpuShuffleEnv.shuffleFetchTimeoutSeconds)
-  extends Iterator[ColumnarBatch]
-    with Logging {
+  extends Iterator[ColumnarBatch] {
+  private[this] val log = org.slf4j.LoggerFactory.getLogger(getClass)
+
+  private def logInfo(msg: => String): Unit = {
+    if (log.isInfoEnabled) {
+      log.info(msg)
+    }
+  }
+
+  private def logDebug(msg: => String): Unit = {
+    if (log.isDebugEnabled) {
+      log.debug(msg)
+    }
+  }
+
+  private def logWarning(msg: => String): Unit = {
+    if (log.isWarnEnabled) {
+      log.warn(msg)
+    }
+  }
+
+  private def logError(msg: => String): Unit = {
+    if (log.isErrorEnabled) {
+      log.error(msg)
+    }
+  }
+
 
   /**
    * General trait encapsulating either a buffer or an error. Used to hand off batches
diff --git a/sql-plugin/src/main/spark340/scala/org/apache/spark/sql/rapids/RapidsCachingReader.scala b/sql-plugin/src/main/spark340/scala/org/apache/spark/sql/rapids/RapidsCachingReader.scala
index 913857c871f..97945e42523 100644
--- a/sql-plugin/src/main/spark340/scala/org/apache/spark/sql/rapids/RapidsCachingReader.scala
+++ b/sql-plugin/src/main/spark340/scala/org/apache/spark/sql/rapids/RapidsCachingReader.scala
@@ -46,7 +46,6 @@ import com.nvidia.spark.rapids._
 import com.nvidia.spark.rapids.shuffle.{RapidsShuffleIterator, RapidsShuffleTransport}
 
 import org.apache.spark.{InterruptibleIterator, TaskContext}
-import org.apache.spark.internal.Logging
 import org.apache.spark.shuffle.{ShuffleReader, ShuffleReadMetricsReporter}
 import org.apache.spark.sql.types.DataType
 import org.apache.spark.sql.vectorized.ColumnarBatch
@@ -79,7 +78,21 @@ class RapidsCachingReader[K, C](
     transport: Option[RapidsShuffleTransport],
     catalog: ShuffleBufferCatalog,
     sparkTypes: Array[DataType])
-  extends ShuffleReader[K, C] with Logging {
+  extends ShuffleReader[K, C] {
+  private[this] val log = org.slf4j.LoggerFactory.getLogger(getClass)
+
+  private def logInfo(msg: => String): Unit = {
+    if (log.isInfoEnabled) {
+      log.info(msg)
+    }
+  }
+
+  private def logDebug(msg: => String): Unit = {
+    if (log.isDebugEnabled) {
+      log.debug(msg)
+    }
+  }
+
 
   override def read(): Iterator[Product2[K, C]] = {
     NvtxRegistry.RAPIDS_CACHING_READER_READ.push()
diff --git a/sql-plugin/src/main/spark341db/scala/com/nvidia/spark/rapids/shims/GpuWindowGroupLimitExec.scala b/sql-plugin/src/main/spark341db/scala/com/nvidia/spark/rapids/shims/GpuWindowGroupLimitExec.scala
index e385fee8a63..aa09c29cd2a 100644
--- a/sql-plugin/src/main/spark341db/scala/com/nvidia/spark/rapids/shims/GpuWindowGroupLimitExec.scala
+++ b/sql-plugin/src/main/spark341db/scala/com/nvidia/spark/rapids/shims/GpuWindowGroupLimitExec.scala
@@ -41,7 +41,6 @@ import com.nvidia.spark.rapids.Arm.withResource
 import com.nvidia.spark.rapids.RmmRapidsRetryIterator.{splitSpillableInHalfByRows, withRetry}
 import com.nvidia.spark.rapids.window.{GpuDenseRank, GpuRank, GpuRowNumber}
 
-import org.apache.spark.internal.Logging
 import org.apache.spark.rdd.RDD
 import org.apache.spark.sql.catalyst.InternalRow
 import org.apache.spark.sql.catalyst.expressions.{Alias, And, Attribute, AttributeReference, DenseRank, EqualTo, Expression, GreaterThan, GreaterThanOrEqual, LessThan, LessThanOrEqual, Literal, NamedExpression, Rank, RowNumber, SortOrder, WindowExpression, WindowSpecDefinition}
@@ -260,8 +259,7 @@ class GpuWindowGroupLimitingIterator(input: Iterator[ColumnarBatch],
                                      limit: Int,
                                      numOutputBatches: GpuMetric,
                                      numOutputRows: GpuMetric)
-  extends Iterator[ColumnarBatch]
-  with Logging {
+  extends Iterator[ColumnarBatch] {
 
   override def hasNext: Boolean = input.hasNext
 
diff --git a/sql-plugin/src/main/spark341db/scala/com/nvidia/spark/rapids/shims/Spark341PlusDBShims.scala b/sql-plugin/src/main/spark341db/scala/com/nvidia/spark/rapids/shims/Spark341PlusDBShims.scala
index 501e4f3c6c7..224d7c6b0a2 100644
--- a/sql-plugin/src/main/spark341db/scala/com/nvidia/spark/rapids/shims/Spark341PlusDBShims.scala
+++ b/sql-plugin/src/main/spark341db/scala/com/nvidia/spark/rapids/shims/Spark341PlusDBShims.scala
@@ -79,7 +79,7 @@ trait Spark341PlusDBShims extends Spark332PlusDBShims {
           // plugin is also an union of all the types of Pandas UDF.
           (TypeSig.commonCudfTypes + TypeSig.ARRAY).nested() + TypeSig.STRUCT,
           TypeSig.unionOfPandasUdfOut,
-          repeatingParamCheck = Some(RepeatingParamCheck(
+          repeatingParamCheck = Some(new RepeatingParamCheck(
             "param",
             (TypeSig.commonCudfTypes + TypeSig.ARRAY + TypeSig.STRUCT).nested(),
             TypeSig.all))),
diff --git a/sql-plugin/src/main/spark341db/scala/org/apache/spark/sql/rapids/execution/python/shims/GpuArrowPythonRunner.scala b/sql-plugin/src/main/spark341db/scala/org/apache/spark/sql/rapids/execution/python/shims/GpuArrowPythonRunner.scala
index 6ffa0abab53..77ee3005330 100644
--- a/sql-plugin/src/main/spark341db/scala/org/apache/spark/sql/rapids/execution/python/shims/GpuArrowPythonRunner.scala
+++ b/sql-plugin/src/main/spark341db/scala/org/apache/spark/sql/rapids/execution/python/shims/GpuArrowPythonRunner.scala
@@ -35,6 +35,23 @@ import org.apache.spark.sql.rapids.shims.ArrowUtilsShim
 import org.apache.spark.sql.types.StructType
 import org.apache.spark.sql.vectorized.ColumnarBatch
 
+// Keep executable line numbers aligned with pre-Spark-4 shims for binary-dedupe.
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
 /**
  * Similar to `PythonUDFRunner`, but exchange data with Python worker via Arrow stream.
  */
diff --git a/sql-plugin/src/main/spark341db/scala/org/apache/spark/sql/rapids/execution/python/shims/GpuCoGroupedArrowPythonRunner.scala b/sql-plugin/src/main/spark341db/scala/org/apache/spark/sql/rapids/execution/python/shims/GpuCoGroupedArrowPythonRunner.scala
index e665435eb25..dba5900e25c 100644
--- a/sql-plugin/src/main/spark341db/scala/org/apache/spark/sql/rapids/execution/python/shims/GpuCoGroupedArrowPythonRunner.scala
+++ b/sql-plugin/src/main/spark341db/scala/org/apache/spark/sql/rapids/execution/python/shims/GpuCoGroupedArrowPythonRunner.scala
@@ -36,6 +36,22 @@ import org.apache.spark.sql.rapids.execution.python.{GpuArrowWriter, GpuPythonRu
 import org.apache.spark.sql.types.StructType
 import org.apache.spark.sql.vectorized.ColumnarBatch
 
+// Keep executable line numbers aligned with pre-Spark-4 shims for binary-dedupe.
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
 /**
  * Python UDF Runner for cogrouped UDFs, designed for `GpuFlatMapCoGroupsInPandasExec` only.
  *
diff --git a/sql-plugin/src/main/spark341db/scala/org/apache/spark/sql/rapids/execution/python/shims/GpuGroupedPythonRunnerFactory.scala b/sql-plugin/src/main/spark341db/scala/org/apache/spark/sql/rapids/execution/python/shims/GpuGroupedPythonRunnerFactory.scala
index ea75745de6c..5b802ae838b 100644
--- a/sql-plugin/src/main/spark341db/scala/org/apache/spark/sql/rapids/execution/python/shims/GpuGroupedPythonRunnerFactory.scala
+++ b/sql-plugin/src/main/spark341db/scala/org/apache/spark/sql/rapids/execution/python/shims/GpuGroupedPythonRunnerFactory.scala
@@ -26,14 +26,14 @@ import org.apache.spark.sql.rapids.shims.ArrowUtilsShim
 import org.apache.spark.sql.types._
 import org.apache.spark.sql.vectorized.ColumnarBatch
 
-case class GpuGroupedPythonRunnerFactory(
+class GpuGroupedPythonRunnerFactory(
   conf: org.apache.spark.sql.internal.SQLConf,
   chainedFunc: Seq[(ChainedPythonFunctions, Long)],
   argOffsets: Array[Array[Int]],
   dedupAttrs: StructType,
   pythonOutputSchema: StructType,
   evalType: Int,
-  argNames: Option[Array[Array[Option[String]]]] = None) {
+  argNames: Option[Array[Array[Option[String]]]]) extends Serializable {
   // Configs from DB runtime
   val maxBytes = conf.pandasZeroConfConversionGroupbyApplyMaxBytesPerSlice
   val zeroConfEnabled = conf.pandasZeroConfConversionGroupbyApplyEnabled
diff --git a/sql-plugin/src/main/spark342/scala/com/nvidia/spark/rapids/shims/DecimalMultiply128.scala b/sql-plugin/src/main/spark342/scala/com/nvidia/spark/rapids/shims/DecimalMultiply128.scala
deleted file mode 100644
index 82c3aa73acf..00000000000
--- a/sql-plugin/src/main/spark342/scala/com/nvidia/spark/rapids/shims/DecimalMultiply128.scala
+++ /dev/null
@@ -1,51 +0,0 @@
-/*
- * Copyright (c) 2023-2026, NVIDIA CORPORATION.
- *
- * Licensed under the Apache License, Version 2.0 (the "License");
- * you may not use this file except in compliance with the License.
- * You may obtain a copy of the License at
- *
- *     http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-
-/*** spark-rapids-shim-json-lines
-{"spark": "342"}
-{"spark": "343"}
-{"spark": "344"}
-{"spark": "350db143"}
-{"spark": "351"}
-{"spark": "352"}
-{"spark": "353"}
-{"spark": "354"}
-{"spark": "355"}
-{"spark": "356"}
-{"spark": "357"}
-{"spark": "358"}
-{"spark": "400"}
-{"spark": "400db173"}
-{"spark": "401"}
-{"spark": "402"}
-{"spark": "411"}
-spark-rapids-shim-json-lines ***/
-package com.nvidia.spark.rapids.shims
-
-import ai.rapids.cudf.{ColumnView, Table}
-import com.nvidia.spark.rapids.jni.DecimalUtils._
-
-object DecimalMultiply128{
-  def apply(castLhs: ColumnView, castRhs: ColumnView, scale: Int): Table = {
-    /**
-     * Calling the version of multiplying 128-bit decimal numbers that casts the result only once
-     * to the final precision and scale.
-     * This version of multiplying 128-bit decimal numbers should only be used with Spark versions
-     * greater than or equal to 3.4.2, 4.0.0, 3.5.1
-     */
-    multiply128(castLhs, castRhs, scale, false)
-  }
-}
diff --git a/sql-plugin/src/main/spark350/scala/com/nvidia/spark/rapids/shims/LegacyBehaviorPolicyShim.scala b/sql-plugin/src/main/spark350/scala/com/nvidia/spark/rapids/shims/LegacyBehaviorPolicyShim.scala
index a3220b961cf..f3e4b8f3666 100644
--- a/sql-plugin/src/main/spark350/scala/com/nvidia/spark/rapids/shims/LegacyBehaviorPolicyShim.scala
+++ b/sql-plugin/src/main/spark350/scala/com/nvidia/spark/rapids/shims/LegacyBehaviorPolicyShim.scala
@@ -33,13 +33,13 @@
 spark-rapids-shim-json-lines ***/
 package com.nvidia.spark.rapids.shims
 
-import org.apache.spark.sql.internal.{LegacyBehaviorPolicy, SQLConf}
+import org.apache.spark.sql.internal.SQLConf
 
 object LegacyBehaviorPolicyShim {
-  val CORRECTED_STR: String = LegacyBehaviorPolicy.CORRECTED.toString
-  val EXCEPTION_STR: String = LegacyBehaviorPolicy.EXCEPTION.toString
+  val CORRECTED_STR: String = "CORRECTED"
+  val EXCEPTION_STR: String = "EXCEPTION"
 
   def isLegacyTimeParserPolicy(): Boolean = {
-    SQLConf.get.legacyTimeParserPolicy == LegacyBehaviorPolicy.LEGACY
+    SQLConf.get.legacyTimeParserPolicy.toString == "LEGACY"
   }
 }
diff --git a/sql-plugin/src/main/spark350/scala/com/nvidia/spark/rapids/shims/NullOutputStreamShim.scala b/sql-plugin/src/main/spark350/scala/com/nvidia/spark/rapids/shims/NullOutputStreamShim.scala
index 319964ee6e9..943e2dd3705 100644
--- a/sql-plugin/src/main/spark350/scala/com/nvidia/spark/rapids/shims/NullOutputStreamShim.scala
+++ b/sql-plugin/src/main/spark350/scala/com/nvidia/spark/rapids/shims/NullOutputStreamShim.scala
@@ -33,8 +33,11 @@
 spark-rapids-shim-json-lines ***/
 package com.nvidia.spark.rapids.shims
 
-import org.apache.commons.io.output.NullOutputStream
+import java.io.OutputStream
 
 object NullOutputStreamShim {
-  def INSTANCE = NullOutputStream.INSTANCE
+  val INSTANCE: OutputStream = new OutputStream {
+    override def write(b: Int): Unit = {}
+    override def write(b: Array[Byte], off: Int, len: Int): Unit = {}
+  }
 }
diff --git a/sql-plugin/src/main/spark350/scala/com/nvidia/spark/rapids/shims/ReplaceDataExecShim.scala b/sql-plugin/src/main/spark350/scala/com/nvidia/spark/rapids/shims/ReplaceDataExecShim.scala
deleted file mode 100644
index 1993e5fe4dd..00000000000
--- a/sql-plugin/src/main/spark350/scala/com/nvidia/spark/rapids/shims/ReplaceDataExecShim.scala
+++ /dev/null
@@ -1,41 +0,0 @@
-/*
- * Copyright (c) 2026, NVIDIA CORPORATION.
- *
- * Licensed under the Apache License, Version 2.0 (the "License");
- * you may not use this file except in compliance with the License.
- * You may obtain a copy of the License at
- *
- *     http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-/*** spark-rapids-shim-json-lines
-{"spark": "350"}
-{"spark": "351"}
-{"spark": "352"}
-{"spark": "353"}
-{"spark": "354"}
-{"spark": "355"}
-{"spark": "356"}
-{"spark": "357"}
-{"spark": "358"}
-spark-rapids-shim-json-lines ***/
-package com.nvidia.spark.rapids.shims
-
-import com.nvidia.spark.rapids.{GpuExec, GpuWrite}
-
-import org.apache.spark.sql.execution.SparkPlan
-import org.apache.spark.sql.execution.datasources.v2.{GpuReplaceDataExec, ReplaceDataExec}
-
-object ReplaceDataExecShim {
-  def convertToGpu(
-      cpuExec: ReplaceDataExec,
-      childPlan: SparkPlan,
-      gpuWrite: GpuWrite): GpuExec = {
-    GpuReplaceDataExec(childPlan, cpuExec.refreshCache, gpuWrite)
-  }
-}
diff --git a/sql-plugin/src/main/spark350/scala/com/nvidia/spark/rapids/shims/Spark350PlusNonDBShims.scala b/sql-plugin/src/main/spark350/scala/com/nvidia/spark/rapids/shims/Spark350PlusNonDBShims.scala
index 9af31e67b91..bb6beb5ef1c 100644
--- a/sql-plugin/src/main/spark350/scala/com/nvidia/spark/rapids/shims/Spark350PlusNonDBShims.scala
+++ b/sql-plugin/src/main/spark350/scala/com/nvidia/spark/rapids/shims/Spark350PlusNonDBShims.scala
@@ -130,7 +130,7 @@ trait Spark350PlusNonDBShims extends Spark340PlusNonDBShims {
           // plugin is also an union of all the types of Pandas UDF.
           (TypeSig.commonCudfTypes + TypeSig.ARRAY).nested() + TypeSig.STRUCT,
           TypeSig.unionOfPandasUdfOut,
-          repeatingParamCheck = Some(RepeatingParamCheck(
+          repeatingParamCheck = Some(new RepeatingParamCheck(
             "param",
             (TypeSig.commonCudfTypes + TypeSig.ARRAY + TypeSig.STRUCT).nested(),
             TypeSig.all))),
@@ -150,8 +150,8 @@ trait Spark350PlusNonDBShims extends Spark340PlusNonDBShims {
         ExprChecks.projectOnly(
           TypeSig.all,
           TypeSig.all,
-          Seq(ParamCheck("condition", TypeSig.all, TypeSig.all)),
-          Some(RepeatingParamCheck("outputs", TypeSig.all, TypeSig.all))
+          Seq(new ParamCheck("condition", TypeSig.all, TypeSig.all)),
+          Some(new RepeatingParamCheck("outputs", TypeSig.all, TypeSig.all))
         ),
         (keep, conf, p, r) => new GpuKeepInstructionMeta(keep, conf, p, r)),
       GpuOverrides.expr[Discard](
@@ -159,15 +159,15 @@ trait Spark350PlusNonDBShims extends Spark340PlusNonDBShims {
         ExprChecks.projectOnly(
           TypeSig.all,
           TypeSig.all,
-          Seq(ParamCheck("condition", TypeSig.all, TypeSig.all))),
+          Seq(new ParamCheck("condition", TypeSig.all, TypeSig.all))),
         (discard, conf, p, r) => new GpuDiscardInstructionMeta(discard, conf, p, r)),
       GpuOverrides.expr[Split](
         "Split instruction for MERGE operations - splits rows into multiple outputs",
         ExprChecks.projectOnly(
           TypeSig.all,
           TypeSig.all,
-          Seq(ParamCheck("condition", TypeSig.all, TypeSig.all)),
-          Some(RepeatingParamCheck("outputs", TypeSig.all, TypeSig.all))),
+          Seq(new ParamCheck("condition", TypeSig.all, TypeSig.all)),
+          Some(new RepeatingParamCheck("outputs", TypeSig.all, TypeSig.all))),
         (split, conf, p, r) => new GpuSplitInstructionMeta(split, conf, p, r))
     ).map(r => (r.getClassFor.asSubclass(classOf[Expression]), r)).toMap
     super.getExprs ++ shimExprs
diff --git a/sql-plugin/src/main/spark350db143/scala/org/apache/spark/sql/rapids/execution/python/shims/PythonArgumentsUtils.scala b/sql-plugin/src/main/spark350db143/scala/org/apache/spark/sql/rapids/execution/python/shims/PythonArgumentsUtils.scala
index f67afdd0015..d735fbf14f7 100644
--- a/sql-plugin/src/main/spark350db143/scala/org/apache/spark/sql/rapids/execution/python/shims/PythonArgumentsUtils.scala
+++ b/sql-plugin/src/main/spark350db143/scala/org/apache/spark/sql/rapids/execution/python/shims/PythonArgumentsUtils.scala
@@ -48,15 +48,15 @@ object PythonArgumentUtils {
             (None, e)
         }
         if (allInputs.exists(_.semanticEquals(value))) {
-          GpuArgumentMeta(allInputs.indexWhere(_.semanticEquals(value)), key)
+          new GpuArgumentMeta(allInputs.indexWhere(_.semanticEquals(value)), key)
         } else {
           allInputs += value
           dataTypes += value.dataType
-          GpuArgumentMeta(allInputs.length - 1, key)
+          new GpuArgumentMeta(allInputs.length - 1, key)
         }
       }.toArray
     }.toArray
-    GpuPythonArguments(allInputs.toSeq, dataTypes.toSeq,
+    new GpuPythonArguments(allInputs.toSeq, dataTypes.toSeq,
       argMetas.map(_.map(_.offset)), Some(argMetas.map(_.map(_.name))))
   }
 }
diff --git a/sql-plugin/src/main/spark400/scala/com/nvidia/spark/rapids/shims/CudfUnsafeRow.scala b/sql-plugin/src/main/spark400/scala/com/nvidia/spark/rapids/shims/CudfUnsafeRow.scala
index ddc8f77b162..d6fd8f120b8 100644
--- a/sql-plugin/src/main/spark400/scala/com/nvidia/spark/rapids/shims/CudfUnsafeRow.scala
+++ b/sql-plugin/src/main/spark400/scala/com/nvidia/spark/rapids/shims/CudfUnsafeRow.scala
@@ -40,4 +40,9 @@ final class CudfUnsafeRow(
   }
 }
 
+// Keep companion line metadata aligned with pre-Spark-4 shims for binary-dedupe.
+
+
+
+
 object CudfUnsafeRow extends CudfUnsafeRowTrait
diff --git a/sql-plugin/src/main/spark400/scala/com/nvidia/spark/rapids/shims/GpuOrcDataReader.scala b/sql-plugin/src/main/spark400/scala/com/nvidia/spark/rapids/shims/GpuOrcDataReader.scala
index 6bd9f9c99ae..1616a6b39b9 100644
--- a/sql-plugin/src/main/spark400/scala/com/nvidia/spark/rapids/shims/GpuOrcDataReader.scala
+++ b/sql-plugin/src/main/spark400/scala/com/nvidia/spark/rapids/shims/GpuOrcDataReader.scala
@@ -36,6 +36,19 @@ class GpuOrcDataReader(
 }
 
 
+// Keep executable line numbers aligned with pre-Spark-4 shims for binary-dedupe.
+
+
+
+
+
+
+
+
+
+
+
+
 object GpuOrcDataReader {
   // File cache is being used, so we want read ranges that can be cached separately
   val shouldMergeDiskRanges: Boolean = false
diff --git a/sql-plugin/src/main/spark400/scala/com/nvidia/spark/rapids/shims/LogicalPlanShims.scala b/sql-plugin/src/main/spark400/scala/com/nvidia/spark/rapids/shims/LogicalPlanShims.scala
index f31ca918539..0eaa55f0c6c 100644
--- a/sql-plugin/src/main/spark400/scala/com/nvidia/spark/rapids/shims/LogicalPlanShims.scala
+++ b/sql-plugin/src/main/spark400/scala/com/nvidia/spark/rapids/shims/LogicalPlanShims.scala
@@ -26,6 +26,18 @@ package com.nvidia.spark.rapids.shims
 import org.apache.spark.sql.catalyst.plans.logical.LogicalPlan
 import org.apache.spark.sql.execution.datasources.{FileIndex, HadoopFsRelation, LogicalRelationWithTable}
 
+// Keep companion line metadata aligned with pre-Spark-4 shims for binary-dedupe.
+
+
+
+
+
+
+
+
+
+
+
 object LogicalPlanShims {
   def getLocations(plan: LogicalPlan): Seq[FileIndex] = plan.collect {
     case LogicalRelationWithTable(t: HadoopFsRelation, _) => t.location
diff --git a/sql-plugin/src/main/spark400/scala/com/nvidia/spark/rapids/shims/NullIntolerantShim.scala b/sql-plugin/src/main/spark400/scala/com/nvidia/spark/rapids/shims/NullIntolerantShim.scala
index 842846d6aae..bd6c0e791c0 100644
--- a/sql-plugin/src/main/spark400/scala/com/nvidia/spark/rapids/shims/NullIntolerantShim.scala
+++ b/sql-plugin/src/main/spark400/scala/com/nvidia/spark/rapids/shims/NullIntolerantShim.scala
@@ -28,3 +28,24 @@ import org.apache.spark.sql.catalyst.expressions.Expression
 trait NullIntolerantShim extends Expression {
   override def nullIntolerant: Boolean = true
 }
+
+abstract class GpuLiteralShim extends com.nvidia.spark.rapids.GpuLeafExpression {
+  def value: Any // literal payload; a null value is handled explicitly in jsonFields
+  def dataType: org.apache.spark.sql.types.DataType // type that `value` is matched against
+  // Builds the "value"/"dataType" JSON fields; null maps to JNull, everything else to a string.
+  override protected def jsonFields: List[org.json4s.JsonAST.JField] = {
+    val jsonValue = (value, dataType) match {
+      case (null, _) => org.json4s.JsonAST.JNull
+      case (i: Int, org.apache.spark.sql.types.DateType) => // Int payload typed as a date
+        org.json4s.JsonAST.JString(
+          org.apache.spark.sql.catalyst.util.DateTimeUtils.toJavaDate(i).toString)
+      case (l: Long, org.apache.spark.sql.types.TimestampType) => // Long typed as timestamp
+        org.json4s.JsonAST.JString(
+          org.apache.spark.sql.catalyst.util.DateTimeUtils.toJavaTimestamp(l).toString)
+      case (other, _) => org.json4s.JsonAST.JString(other.toString) // fallback: plain toString
+    }
+    ("value" -> jsonValue) ::
+      ("dataType" -> org.apache.spark.sql.rapids.execution.TrampolineUtil.jsonValue(dataType)
+        .asInstanceOf[org.json4s.JsonAST.JValue]) :: Nil
+  }
+}
diff --git a/sql-plugin/src/main/spark400/scala/com/nvidia/spark/rapids/shims/ShimPredicate.scala b/sql-plugin/src/main/spark400/scala/com/nvidia/spark/rapids/shims/ShimPredicate.scala
new file mode 100644
index 00000000000..837aa287a8f
--- /dev/null
+++ b/sql-plugin/src/main/spark400/scala/com/nvidia/spark/rapids/shims/ShimPredicate.scala
@@ -0,0 +1,54 @@
+/*
+ * Copyright (c) 2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+/*** spark-rapids-shim-json-lines
+{"spark": "400"}
+{"spark": "400db173"}
+{"spark": "401"}
+{"spark": "402"}
+spark-rapids-shim-json-lines ***/
+package com.nvidia.spark.rapids.shims
+
+import org.apache.spark.sql.catalyst.expressions.Predicate
+
+trait ShimPredicate extends Predicate { // member below is declared without `override`
+  def contextIndependentFoldable: Boolean = children.forall(_.foldable) // all children foldable
+}
+
+trait ShimDataWritingCommand
+    extends org.apache.spark.sql.execution.command.DataWritingCommand
+    with ShimUnaryCommand { // adapts the row-based run() onto a columnar runColumnar()
+  def runColumnar( // abstract hook: implementers produce the ColumnarBatch results
+      sparkSession: org.apache.spark.sql.classic.SparkSession,
+      child: org.apache.spark.sql.execution.SparkPlan):
+      Seq[org.apache.spark.sql.vectorized.ColumnarBatch]
+  // Untyped entry point: casts sparkSession to the classic SparkSession, then runColumnar.
+  def runColumnarFromAny(
+      sparkSession: AnyRef,
+      child: org.apache.spark.sql.execution.SparkPlan):
+      Seq[org.apache.spark.sql.vectorized.ColumnarBatch] = {
+    runColumnar(sparkSession.asInstanceOf[org.apache.spark.sql.classic.SparkSession], child)
+  }
+  // Row-based run(): executes runColumnar, asserts it produced no batches, returns no rows.
+  override def run(
+      sparkSession: org.apache.spark.sql.classic.SparkSession,
+      child: org.apache.spark.sql.execution.SparkPlan): Seq[org.apache.spark.sql.Row] = {
+    com.nvidia.spark.rapids.Arm.withResource(runColumnar(sparkSession, child)) { batches =>
+      assert(batches.isEmpty) // NOTE(review): withResource presumably closes them - confirm
+    }
+    Seq.empty[org.apache.spark.sql.Row]
+  }
+}
diff --git a/sql-plugin/src/main/spark400/scala/com/nvidia/spark/rapids/shims/Spark400PlusCommonShims.scala b/sql-plugin/src/main/spark400/scala/com/nvidia/spark/rapids/shims/Spark400PlusCommonShims.scala
index d3f63a943a1..72a8bbc2f38 100644
--- a/sql-plugin/src/main/spark400/scala/com/nvidia/spark/rapids/shims/Spark400PlusCommonShims.scala
+++ b/sql-plugin/src/main/spark400/scala/com/nvidia/spark/rapids/shims/Spark400PlusCommonShims.scala
@@ -40,7 +40,7 @@ trait Spark400PlusCommonShims extends Spark350PlusNonDBShims {
           "And(GreaterThanOrEqual(ref, lower), LessThanOrEqual(ref, upper);  StructToJson is " +
           "replaced by Invoke(Literal(StructsToJsonEvaluator), evaluate, string_type, arguments)",
         InvokeCheck,
-        InvokeExprMeta)
+        (invoke, conf, p, r) => new InvokeExprMeta(invoke, conf, p, r))
         .note("The supported types are not deterministic since it's a dynamic expression")
     ).map(r => (r.getClassFor.asSubclass(classOf[Expression]), r)).toMap
     super.getExprs ++ shimExprs
diff --git a/sql-plugin/src/main/spark400/scala/org/apache/spark/sql/nvidia/DFUDFShims.scala b/sql-plugin/src/main/spark400/scala/org/apache/spark/sql/nvidia/DFUDFShims.scala
deleted file mode 100644
index f3f48170060..00000000000
--- a/sql-plugin/src/main/spark400/scala/org/apache/spark/sql/nvidia/DFUDFShims.scala
+++ /dev/null
@@ -1,33 +0,0 @@
-/*
- * Copyright (c) 2024-2026, NVIDIA CORPORATION.
- *
- * Licensed under the Apache License, Version 2.0 (the "License");
- * you may not use this file except in compliance with the License.
- * You may obtain a copy of the License at
- *
- *     http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-
-/*** spark-rapids-shim-json-lines
-{"spark": "400"}
-{"spark": "400db173"}
-{"spark": "401"}
-{"spark": "402"}
-{"spark": "411"}
-spark-rapids-shim-json-lines ***/
-package org.apache.spark.sql.nvidia
-
-import org.apache.spark.sql.Column
-import org.apache.spark.sql.catalyst.expressions.Expression
-import org.apache.spark.sql.classic.{ColumnNodeToExpressionConverter, ExpressionUtils}
-
-object DFUDFShims {
-  def columnToExpr(c: Column): Expression = ColumnNodeToExpressionConverter(c.node)
-  def exprToColumn(e: Expression): Column = ExpressionUtils.column(e)
-}
diff --git a/sql-plugin/src/main/spark400/scala/org/apache/spark/sql/rapids/shims/InvokeExprMeta.scala b/sql-plugin/src/main/spark400/scala/org/apache/spark/sql/rapids/shims/InvokeExprMeta.scala
index d66e879667a..4cb2c60811d 100644
--- a/sql-plugin/src/main/spark400/scala/org/apache/spark/sql/rapids/shims/InvokeExprMeta.scala
+++ b/sql-plugin/src/main/spark400/scala/org/apache/spark/sql/rapids/shims/InvokeExprMeta.scala
@@ -33,7 +33,7 @@ import org.apache.spark.sql.catalyst.expressions.url.ParseUrlEvaluator
 import org.apache.spark.sql.rapids.{GpuParseUrl, GpuStructsToJson}
 import org.apache.spark.sql.types._
 
-case class InvokeExprMeta(
+class InvokeExprMeta(
     invoke: Invoke,
     override val conf: RapidsConf,
     p: Option[RapidsMeta[_, _, _]],
diff --git a/sql-plugin/src/main/spark400db173/scala/com/nvidia/spark/rapids/shims/DayTimeIntervalShims.scala b/sql-plugin/src/main/spark400db173/scala/com/nvidia/spark/rapids/shims/DayTimeIntervalShims.scala
deleted file mode 100644
index aa957363b62..00000000000
--- a/sql-plugin/src/main/spark400db173/scala/com/nvidia/spark/rapids/shims/DayTimeIntervalShims.scala
+++ /dev/null
@@ -1,105 +0,0 @@
-/*
- * Copyright (c) 2022-2026, NVIDIA CORPORATION.
- *
- * Licensed under the Apache License, Version 2.0 (the "License");
- * you may not use this file except in compliance with the License.
- * You may obtain a copy of the License at
- *
- *     http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-
-/*** spark-rapids-shim-json-lines
-{"spark": "400db173"}
-{"spark": "411"}
-spark-rapids-shim-json-lines ***/
-package com.nvidia.spark.rapids.shims
-
-import com.nvidia.spark.rapids._
-
-import org.apache.spark.sql.catalyst.expressions._
-import org.apache.spark.sql.internal.SQLConf
-import org.apache.spark.sql.rapids._
-import org.apache.spark.sql.rapids.shims.{GpuDivideDTInterval, GpuMultiplyDTInterval,
-  GpuTimestampAddInterval}
-import org.apache.spark.sql.types.{CalendarIntervalType, DayTimeIntervalType}
-import org.apache.spark.unsafe.types.CalendarInterval
-
-/**
- * DayTimeInterval shims for Spark 4.1.1+
- * TimeAdd was renamed to TimestampAddInterval in Spark 4.1.0
- */
-object DayTimeIntervalShims {
-  def exprs: Map[Class[_ <: Expression], ExprRule[_ <: Expression]] = Seq(
-    GpuOverrides.expr[Abs](
-      "Absolute value",
-      ExprChecks.unaryProjectAndAstInputMatchesOutput(
-        TypeSig.implicitCastsAstTypes,
-        TypeSig.gpuNumeric + GpuTypeShims.additionalArithmeticSupportedTypes,
-        TypeSig.cpuNumeric + GpuTypeShims.additionalArithmeticSupportedTypes),
-      (a, conf, p, r) => new UnaryAstExprMeta[Abs](a, conf, p, r) {
-        val ansiEnabled = SQLConf.get.ansiEnabled
-
-        override def tagSelfForAst(): Unit = {
-          if (ansiEnabled && GpuAnsi.needBasicOpOverflowCheck(a.dataType)) {
-            willNotWorkInAst("AST unary minus does not support ANSI mode.")
-          }
-        }
-
-        // ANSI support for ABS was added in 3.2.0 SPARK-33275
-        override def convertToGpu(child: Expression): GpuExpression = GpuAbs(child, ansiEnabled)
-      }),
-    GpuOverrides.expr[MultiplyDTInterval](
-      "Day-time interval * number",
-      ExprChecks.binaryProject(
-        TypeSig.DAYTIME,
-        TypeSig.DAYTIME,
-        ("lhs", TypeSig.DAYTIME, TypeSig.DAYTIME),
-        ("rhs", TypeSig.gpuNumeric - TypeSig.DECIMAL_128, TypeSig.gpuNumeric)),
-      (a, conf, p, r) => new BinaryExprMeta[MultiplyDTInterval](a, conf, p, r) {
-        override def convertToGpu(lhs: Expression, rhs: Expression): GpuExpression =
-          GpuMultiplyDTInterval(lhs, rhs)
-      }),
-    GpuOverrides.expr[DivideDTInterval](
-      "Day-time interval / number",
-      ExprChecks.binaryProject(
-        TypeSig.DAYTIME,
-        TypeSig.DAYTIME,
-        ("lhs", TypeSig.DAYTIME, TypeSig.DAYTIME),
-        ("rhs", TypeSig.gpuNumeric - TypeSig.DECIMAL_128, TypeSig.gpuNumeric)),
-      (a, conf, p, r) => new BinaryExprMeta[DivideDTInterval](a, conf, p, r) {
-        override def convertToGpu(lhs: Expression, rhs: Expression): GpuExpression =
-          GpuDivideDTInterval(lhs, rhs)
-      }),
-    GpuOverrides.expr[TimestampAddInterval](
-      "Adds interval to timestamp",
-      ExprChecks.binaryProject(TypeSig.TIMESTAMP, TypeSig.TIMESTAMP,
-        ("start", TypeSig.TIMESTAMP, TypeSig.TIMESTAMP),
-        // interval support DAYTIME column or CALENDAR literal
-        ("interval", TypeSig.DAYTIME + TypeSig.lit(TypeEnum.CALENDAR)
-            .withPsNote(TypeEnum.CALENDAR, "month intervals are not supported"),
-            TypeSig.DAYTIME + TypeSig.CALENDAR)),
-      (timeAdd, conf, p, r) => new BinaryExprMeta[TimestampAddInterval](timeAdd, conf, p, r) {
-        override def tagExprForGpu(): Unit = {
-          GpuOverrides.extractLit(timeAdd.interval).foreach { lit =>
-            lit.dataType match {
-              case CalendarIntervalType =>
-                val intvl = lit.value.asInstanceOf[CalendarInterval]
-                if (intvl.months != 0) {
-                  willNotWorkOnGpu("interval months isn't supported")
-                }
-              case _: DayTimeIntervalType => // Supported
-            }
-          }
-        }
-
-        override def convertToGpu(lhs: Expression, rhs: Expression): GpuExpression =
-          GpuTimestampAddInterval(lhs, rhs)
-      })
-  ).map(r => (r.getClassFor.asSubclass(classOf[Expression]), r)).toMap
-}
diff --git a/sql-plugin/src/main/spark400db173/scala/com/nvidia/spark/rapids/shims/Spark400PlusDBShims.scala b/sql-plugin/src/main/spark400db173/scala/com/nvidia/spark/rapids/shims/Spark400PlusDBShims.scala
index 2b443be563c..22c37269c9b 100644
--- a/sql-plugin/src/main/spark400db173/scala/com/nvidia/spark/rapids/shims/Spark400PlusDBShims.scala
+++ b/sql-plugin/src/main/spark400db173/scala/com/nvidia/spark/rapids/shims/Spark400PlusDBShims.scala
@@ -35,7 +35,7 @@ trait Spark400PlusDBShims extends Spark341PlusDBShims {
           "And(GreaterThanOrEqual(ref, lower), LessThanOrEqual(ref, upper);  StructToJson is " +
           "replaced by Invoke(Literal(StructsToJsonEvaluator), evaluate, string_type, arguments)",
         InvokeCheck,
-        InvokeExprMeta)
+        (invoke, conf, p, r) => new InvokeExprMeta(invoke, conf, p, r))
         .note("The supported types are not deterministic since it's a dynamic expression")
     ).map(r => (r.getClassFor.asSubclass(classOf[Expression]), r)).toMap
     super.getExprs ++ shimExprs
diff --git a/sql-plugin/src/main/spark400db173/scala/com/nvidia/spark/rapids/shims/SparkShims.scala b/sql-plugin/src/main/spark400db173/scala/com/nvidia/spark/rapids/shims/SparkShims.scala
index 4f2994f1044..8d50f882110 100644
--- a/sql-plugin/src/main/spark400db173/scala/com/nvidia/spark/rapids/shims/SparkShims.scala
+++ b/sql-plugin/src/main/spark400db173/scala/com/nvidia/spark/rapids/shims/SparkShims.scala
@@ -43,12 +43,12 @@ object SparkShimImpl extends Spark400PlusDBShims {
       GpuOverrides.expr[CollationAwareMurmur3Hash](
         "Collation-aware murmur3 hash operator",
         HashExprChecks.murmur3ProjectChecks,
-        Murmur3HashExprMeta.apply
+        ((expr, conf, parent, rule) => new Murmur3HashExprMeta(expr, conf, parent, rule))
       ),
       GpuOverrides.expr[CollationAwareXxHash64](
         "Collation-aware xxhash64 operator",
         HashExprChecks.xxhash64ProjectChecks,
-        XxHash64ExprMeta.apply
+        ((expr, conf, parent, rule) => new XxHash64ExprMeta(expr, conf, parent, rule))
       )
     ).map(r => (r.getClassFor.asSubclass(classOf[Expression]), r)).toMap
     super.getExprs ++ shimExprs
diff --git a/sql-plugin/src/main/spark400db173/scala/com/nvidia/spark/rapids/shims/TimeAddShims.scala b/sql-plugin/src/main/spark400db173/scala/com/nvidia/spark/rapids/shims/TimeAddShims.scala
index 83d9298bfa2..5163eb14680 100644
--- a/sql-plugin/src/main/spark400db173/scala/com/nvidia/spark/rapids/shims/TimeAddShims.scala
+++ b/sql-plugin/src/main/spark400db173/scala/com/nvidia/spark/rapids/shims/TimeAddShims.scala
@@ -22,12 +22,40 @@ package com.nvidia.spark.rapids.shims
 
 import com.nvidia.spark.rapids._
 
-import org.apache.spark.sql.catalyst.expressions.Expression
+import org.apache.spark.sql.catalyst.expressions.{Expression, TimestampAddInterval}
+import org.apache.spark.sql.rapids.shims.GpuTimestampAddInterval
+import org.apache.spark.sql.types.{CalendarIntervalType, DayTimeIntervalType}
+import org.apache.spark.unsafe.types.CalendarInterval
 
 /**
- * Empty TimeAddShims for Spark 4.1.0+ and Databricks 17.3.
- * TimeAdd was renamed to TimestampAddInterval and is handled by DayTimeIntervalShims.
+ * TimestampAddInterval support for Spark 4.1.0+ and Databricks 17.3.
+ * TimeAdd was renamed to TimestampAddInterval in Spark 4.1.
  */
 object TimeAddShims {
-  val exprs: Map[Class[_ <: Expression], ExprRule[_ <: Expression]] = Map.empty
+  val exprs: Map[Class[_ <: Expression], ExprRule[_ <: Expression]] = Seq(
+    GpuOverrides.expr[TimestampAddInterval](
+      "Adds interval to timestamp",
+      ExprChecks.binaryProject(TypeSig.TIMESTAMP, TypeSig.TIMESTAMP,
+        ("start", TypeSig.TIMESTAMP, TypeSig.TIMESTAMP),
+        ("interval", TypeSig.DAYTIME + TypeSig.lit(TypeEnum.CALENDAR)
+            .withPsNote(TypeEnum.CALENDAR, "month intervals are not supported"),
+            TypeSig.DAYTIME + TypeSig.CALENDAR)), // interval: DAYTIME column or CALENDAR literal
+      (timeAdd, conf, p, r) => new BinaryExprMeta[TimestampAddInterval](timeAdd, conf, p, r) {
+        override def tagExprForGpu(): Unit = {
+          GpuOverrides.extractLit(timeAdd.interval).foreach { lit => // presumably literal-only
+            lit.dataType match {
+              case CalendarIntervalType =>
+                val intvl = lit.value.asInstanceOf[CalendarInterval]
+                if (intvl.months != 0) { // a non-zero month component is rejected for the GPU
+                  willNotWorkOnGpu("interval months isn't supported")
+                }
+              case _: DayTimeIntervalType => // Supported
+            }
+          }
+        }
+
+        override def convertToGpu(lhs: Expression, rhs: Expression): GpuExpression =
+          GpuTimestampAddInterval(lhs, rhs)
+      })
+  ).map(r => (r.getClassFor.asSubclass(classOf[Expression]), r)).toMap // key: expr class
 }
diff --git a/sql-plugin/src/main/spark400db173/scala/com/nvidia/spark/rapids/shims/TryModeShim.scala b/sql-plugin/src/main/spark400db173/scala/com/nvidia/spark/rapids/shims/TryModeShim.scala
deleted file mode 100644
index 9d155cecb91..00000000000
--- a/sql-plugin/src/main/spark400db173/scala/com/nvidia/spark/rapids/shims/TryModeShim.scala
+++ /dev/null
@@ -1,45 +0,0 @@
-/*
- * Copyright (c) 2026, NVIDIA CORPORATION.
- *
- * Licensed under the Apache License, Version 2.0 (the "License");
- * you may not use this file except in compliance with the License.
- * You may obtain a copy of the License at
- *
- *     http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-
-/*** spark-rapids-shim-json-lines
-{"spark": "400db173"}
-{"spark": "411"}
-spark-rapids-shim-json-lines ***/
-package com.nvidia.spark.rapids.shims
-
-import org.apache.spark.sql.catalyst.expressions.{Add, Divide, EvalMode, Expression, Multiply, Remainder, Subtract}
-import org.apache.spark.sql.catalyst.expressions.aggregate.{Average, Sum}
-
-/**
- * Spark 4.1.0+ and Databricks 17.3 version where evalMode
- * changed to evalContext.evalMode for arithmetic.
- * See: https://github.com/apache/spark/commit/a96e9ca81518bff31b0089d459fe78804ca1aa38
- */
-object TryModeShim {
-  def isTryMode(expr: Expression): Boolean = {
-    val evalMode = expr match {
-      case add: Add => add.evalContext.evalMode
-      case sub: Subtract => sub.evalContext.evalMode
-      case mul: Multiply => mul.evalContext.evalMode
-      case div: Divide => div.evalContext.evalMode
-      case mod: Remainder => mod.evalContext.evalMode
-      case avg: Average => avg.evalMode  // Average still uses evalMode directly as a parameter
-      case sum: Sum => sum.evalContext.evalMode  // Sum uses evalContext.evalMode
-      case _ => throw new RuntimeException(s"Unsupported expression $expr in TRY mode")
-    }
-    evalMode == EvalMode.TRY
-  }
-}
diff --git a/sql-plugin/src/main/spark400db173/scala/org/apache/spark/sql/rapids/execution/python/shims/WindowInPandasExecTypeShim.scala b/sql-plugin/src/main/spark400db173/scala/org/apache/spark/sql/rapids/execution/python/shims/WindowInPandasExecTypeShim.scala
index 8c5ed60a4c0..d8c84ed87aa 100644
--- a/sql-plugin/src/main/spark400db173/scala/org/apache/spark/sql/rapids/execution/python/shims/WindowInPandasExecTypeShim.scala
+++ b/sql-plugin/src/main/spark400db173/scala/org/apache/spark/sql/rapids/execution/python/shims/WindowInPandasExecTypeShim.scala
@@ -22,6 +22,26 @@ package org.apache.spark.sql.rapids.execution.python.shims
 
 import org.apache.spark.sql.execution.python.ArrowWindowPythonExec
 
+// Keep executable line numbers aligned with pre-Spark-4 shims for binary-dedupe.
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
 /**
  * WindowInPandasExec was renamed to ArrowWindowPythonExec in Spark 4.1.0.
  * Use the new class name as the type alias.
diff --git a/sql-plugin/src/main/spark401/scala/com/nvidia/spark/rapids/shims/SparkShims.scala b/sql-plugin/src/main/spark401/scala/com/nvidia/spark/rapids/shims/SparkShims.scala
index 46ac248006c..a2a321c4c2d 100644
--- a/sql-plugin/src/main/spark401/scala/com/nvidia/spark/rapids/shims/SparkShims.scala
+++ b/sql-plugin/src/main/spark401/scala/com/nvidia/spark/rapids/shims/SparkShims.scala
@@ -31,12 +31,12 @@ object SparkShimImpl extends Spark400PlusCommonShims {
       GpuOverrides.expr[CollationAwareMurmur3Hash](
         "Collation-aware murmur3 hash operator",
         HashExprChecks.murmur3ProjectChecks,
-        Murmur3HashExprMeta.apply
+        ((expr, conf, parent, rule) => new Murmur3HashExprMeta(expr, conf, parent, rule))
       ),
       GpuOverrides.expr[CollationAwareXxHash64](
         "Collation-aware xxhash64 operator",
         HashExprChecks.xxhash64ProjectChecks,
-        XxHash64ExprMeta.apply
+        ((expr, conf, parent, rule) => new XxHash64ExprMeta(expr, conf, parent, rule))
       )
     ).map(r => (r.getClassFor.asSubclass(classOf[Expression]), r)).toMap
     super.getExprs ++ shimExprs
diff --git a/sql-plugin/src/main/spark411/scala/com/nvidia/spark/rapids/shims/ShimPredicate.scala b/sql-plugin/src/main/spark411/scala/com/nvidia/spark/rapids/shims/ShimPredicate.scala
new file mode 100644
index 00000000000..1578dfc5c22
--- /dev/null
+++ b/sql-plugin/src/main/spark411/scala/com/nvidia/spark/rapids/shims/ShimPredicate.scala
@@ -0,0 +1,52 @@
+/*
+ * Copyright (c) 2026, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+/*** spark-rapids-shim-json-lines
+{"spark": "411"}
+spark-rapids-shim-json-lines ***/
+package com.nvidia.spark.rapids.shims
+
+import org.apache.spark.sql.catalyst.expressions.Predicate
+
+trait ShimPredicate extends Predicate {
+  override def contextIndependentFoldable: Boolean = // overrides the inherited definition
+    children.forall(_.contextIndependentFoldable) // true only if it holds for every child
+}
+
+trait ShimDataWritingCommand
+    extends org.apache.spark.sql.execution.command.DataWritingCommand
+    with ShimUnaryCommand { // adapts the row-based run() onto a columnar runColumnar()
+  def runColumnar( // abstract hook: implementers produce the ColumnarBatch results
+      sparkSession: org.apache.spark.sql.classic.SparkSession,
+      child: org.apache.spark.sql.execution.SparkPlan):
+      Seq[org.apache.spark.sql.vectorized.ColumnarBatch]
+  // Untyped entry point: casts sparkSession to the classic SparkSession, then runColumnar.
+  def runColumnarFromAny(
+      sparkSession: AnyRef,
+      child: org.apache.spark.sql.execution.SparkPlan):
+      Seq[org.apache.spark.sql.vectorized.ColumnarBatch] = {
+    runColumnar(sparkSession.asInstanceOf[org.apache.spark.sql.classic.SparkSession], child)
+  }
+  // Row-based run(): executes runColumnar, asserts it produced no batches, returns no rows.
+  override def run(
+      sparkSession: org.apache.spark.sql.classic.SparkSession,
+      child: org.apache.spark.sql.execution.SparkPlan): Seq[org.apache.spark.sql.Row] = {
+    com.nvidia.spark.rapids.Arm.withResource(runColumnar(sparkSession, child)) { batches =>
+      assert(batches.isEmpty) // NOTE(review): withResource presumably closes them - confirm
+    }
+    Seq.empty[org.apache.spark.sql.Row]
+  }
+}
diff --git a/sql-plugin/src/main/spark411/scala/com/nvidia/spark/rapids/shims/SparkShims.scala b/sql-plugin/src/main/spark411/scala/com/nvidia/spark/rapids/shims/SparkShims.scala
index f3f6c6bb675..dca0bcef176 100644
--- a/sql-plugin/src/main/spark411/scala/com/nvidia/spark/rapids/shims/SparkShims.scala
+++ b/sql-plugin/src/main/spark411/scala/com/nvidia/spark/rapids/shims/SparkShims.scala
@@ -36,12 +36,12 @@ object SparkShimImpl extends Spark400PlusCommonShims with RebaseShims {
       GpuOverrides.expr[CollationAwareMurmur3Hash](
         "Collation-aware murmur3 hash operator",
         HashExprChecks.murmur3ProjectChecks,
-        Murmur3HashExprMeta.apply
+        ((expr, conf, parent, rule) => new Murmur3HashExprMeta(expr, conf, parent, rule))
       ),
       GpuOverrides.expr[CollationAwareXxHash64](
         "Collation-aware xxhash64 operator",
         HashExprChecks.xxhash64ProjectChecks,
-        XxHash64ExprMeta.apply
+        ((expr, conf, parent, rule) => new XxHash64ExprMeta(expr, conf, parent, rule))
       )
     ).map(r => (r.getClassFor.asSubclass(classOf[Expression]), r)).toMap
     // Include TimeAddShims for TimestampAddInterval support in 4.1.0
diff --git a/sql-plugin/src/main/spark411/scala/org/apache/spark/sql/rapids/execution/python/shims/GpuGroupedPythonRunnerFactory.scala b/sql-plugin/src/main/spark411/scala/org/apache/spark/sql/rapids/execution/python/shims/GpuGroupedPythonRunnerFactory.scala
index e51f5bc5b42..9d04faddd95 100644
--- a/sql-plugin/src/main/spark411/scala/org/apache/spark/sql/rapids/execution/python/shims/GpuGroupedPythonRunnerFactory.scala
+++ b/sql-plugin/src/main/spark411/scala/org/apache/spark/sql/rapids/execution/python/shims/GpuGroupedPythonRunnerFactory.scala
@@ -34,14 +34,14 @@ import org.apache.spark.sql.vectorized.ColumnarBatch
  *   - Create new Arrow stream for each batch
  *   - Send 0 to indicate end of data
  */
-case class GpuGroupedPythonRunnerFactory(
+class GpuGroupedPythonRunnerFactory(
     conf: org.apache.spark.sql.internal.SQLConf,
     chainedFunc: Seq[(ChainedPythonFunctions, Long)],
     argOffsets: Array[Array[Int]],
     dedupAttrs: StructType,
     pythonOutputSchema: StructType,
     evalType: Int,
-    argNames: Option[Array[Array[Option[String]]]] = None) {
+    argNames: Option[Array[Array[Option[String]]]]) extends Serializable {
   val sessionLocalTimeZone = conf.sessionLocalTimeZone
   val pythonRunnerConf = ArrowUtilsShim.getPythonRunnerConfMap(conf)
 
diff --git a/tests/src/test/scala/com/nvidia/spark/rapids/DumpUtilsSuite.scala b/tests/src/test/scala/com/nvidia/spark/rapids/DumpUtilsSuite.scala
index 5c6d0fbe634..8bd42e8153c 100644
--- a/tests/src/test/scala/com/nvidia/spark/rapids/DumpUtilsSuite.scala
+++ b/tests/src/test/scala/com/nvidia/spark/rapids/DumpUtilsSuite.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2025, NVIDIA CORPORATION.
+ * Copyright (c) 2025-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -120,7 +120,7 @@ class DumpUtilsSuite extends AnyFunSuite with BeforeAndAfterAll {
         val header = headerOptional.get()
         val buffer = HostMemoryBuffer.allocate(header.getTotalDataLen())
         buffer.copyFromStream(0, din, header.getTotalDataLen())
-        val spillableKudoTable = SpillableKudoTable(header, buffer)
+        val spillableKudoTable = SpillableKudoTable.from(header, buffer)
         withResource(new KudoSerializedTableColumn(spillableKudoTable)) { column =>
           val batch = new ColumnarBatch(Array(column.asInstanceOf[GpuColumnVectorBase]),
             spillableKudoTable.header.getNumRows)
diff --git a/tests/src/test/scala/com/nvidia/spark/rapids/GpuCoalesceBatchesRetrySuite.scala b/tests/src/test/scala/com/nvidia/spark/rapids/GpuCoalesceBatchesRetrySuite.scala
index c42089daf25..bb13a1639f3 100644
--- a/tests/src/test/scala/com/nvidia/spark/rapids/GpuCoalesceBatchesRetrySuite.scala
+++ b/tests/src/test/scala/com/nvidia/spark/rapids/GpuCoalesceBatchesRetrySuite.scala
@@ -310,7 +310,7 @@ class GpuCoalesceBatchesRetrySuite
         NoopMetric,
         NoopMetric,
         "test",
-        TableCompressionCodecConfig(1024, 1024)) with CoalesceIteratorMocks {
+        new TableCompressionCodecConfig(1024, 1024)) with CoalesceIteratorMocks {
     override def populateCandidateBatches(): Boolean = {
       val lastBatchTag = super.populateCandidateBatches()
       injectError(injectRetry, injectSplitAndRetry)
diff --git a/tests/src/test/scala/com/nvidia/spark/rapids/GpuCoalesceBatchesSuite.scala b/tests/src/test/scala/com/nvidia/spark/rapids/GpuCoalesceBatchesSuite.scala
index 20919d171d4..07694c99d23 100644
--- a/tests/src/test/scala/com/nvidia/spark/rapids/GpuCoalesceBatchesSuite.scala
+++ b/tests/src/test/scala/com/nvidia/spark/rapids/GpuCoalesceBatchesSuite.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2020-2023, NVIDIA CORPORATION.
+ * Copyright (c) 2020-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -657,7 +657,7 @@ class GpuCoalesceBatchesSuite extends SparkQueryCompareTestSuite {
     withResource(codec.createBatchCompressor(0, Cuda.DEFAULT_STREAM)) { compressor =>
       compressor.addTableToCompress(buildContiguousTable(start, numRows))
       withResource(compressor.finish()) { compressed =>
-        GpuCompressedColumnVector.from(compressed.head)
+        GpuCompressedColumnVector.from(compressed.head.buffer, compressed.head.meta)
       }
     }
   }
diff --git a/tests/src/test/scala/com/nvidia/spark/rapids/GpuSemaphoreSuite.scala b/tests/src/test/scala/com/nvidia/spark/rapids/GpuSemaphoreSuite.scala
index 076139ebcb0..a47f860c8d6 100644
--- a/tests/src/test/scala/com/nvidia/spark/rapids/GpuSemaphoreSuite.scala
+++ b/tests/src/test/scala/com/nvidia/spark/rapids/GpuSemaphoreSuite.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2019-2024, NVIDIA CORPORATION.
+ * Copyright (c) 2019-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -86,15 +86,17 @@ class GpuSemaphoreSuite extends AnyFunSuite
 
   def assertAcquired(result: TryAcquireResult): Unit = result match {
     case SemaphoreAcquired => // NOOP
-    case AcquireFailed(_) =>
+    case _: AcquireFailed =>
       fail("The Semaphore was not acquired")
   }
 
   def assertNotAcquired(numExpectedWaiting: Int, result: TryAcquireResult): Unit = result match {
     case SemaphoreAcquired =>
       fail("The Semaphore was acquired when we didn't expect it")
-    case AcquireFailed(numWaiting) =>
-      assert(numWaiting == numExpectedWaiting, "The number of waiting tasks didn't match")
+    case failed: AcquireFailed =>
+      assert(
+        failed.numWaitingTasks == numExpectedWaiting,
+        "The number of waiting tasks didn't match")
   }
 
   test("multi tryAcquire") {
diff --git a/tests/src/test/scala/com/nvidia/spark/rapids/GpuSortRetrySuite.scala b/tests/src/test/scala/com/nvidia/spark/rapids/GpuSortRetrySuite.scala
index 6e1542f7631..e08c3d6b178 100644
--- a/tests/src/test/scala/com/nvidia/spark/rapids/GpuSortRetrySuite.scala
+++ b/tests/src/test/scala/com/nvidia/spark/rapids/GpuSortRetrySuite.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2023-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2023-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -176,10 +176,14 @@ class GpuSortRetrySuite extends RmmSparkRetrySuiteBase with MockitoSugar {
   }
 
   test("GPU each batch sort with GpuRetryOOM") {
-    val eachBatchIter = GpuSortEachBatchIterator(
+    val eachBatchIter = new GpuSortEachBatchIterator(
       batchIter(2),
       gpuSorter,
-      singleBatch = false)
+      singleBatch = false,
+      opTime = NoopMetric,
+      sortTime = NoopMetric,
+      outputBatches = NoopMetric,
+      outputRows = NoopMetric)
     RmmSpark.forceRetryOOM(RmmSpark.getCurrentThreadId, 2,
       RmmSpark.OomInjectionType.GPU.ordinal, 0)
     while (eachBatchIter.hasNext) {
@@ -201,10 +205,14 @@ class GpuSortRetrySuite extends RmmSparkRetrySuiteBase with MockitoSugar {
   test("GPU each batch sort throws GpuSplitAndRetryOOM") {
     val inputIter = batchIter(2)
     try {
-      val eachBatchIter = GpuSortEachBatchIterator(
+      val eachBatchIter = new GpuSortEachBatchIterator(
         inputIter,
         gpuSorter,
-        singleBatch = false)
+        singleBatch = false,
+        opTime = NoopMetric,
+        sortTime = NoopMetric,
+        outputBatches = NoopMetric,
+        outputRows = NoopMetric)
       RmmSpark.forceSplitAndRetryOOM(RmmSpark.getCurrentThreadId, 1,
         RmmSpark.OomInjectionType.GPU.ordinal, 0)
       assertThrows[GpuSplitAndRetryOOM] {
diff --git a/tests/src/test/scala/com/nvidia/spark/rapids/MetaUtilsSuite.scala b/tests/src/test/scala/com/nvidia/spark/rapids/MetaUtilsSuite.scala
index ebcee3d230e..1060fd62c4a 100644
--- a/tests/src/test/scala/com/nvidia/spark/rapids/MetaUtilsSuite.scala
+++ b/tests/src/test/scala/com/nvidia/spark/rapids/MetaUtilsSuite.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2020-2023, NVIDIA CORPORATION.
+ * Copyright (c) 2020-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -134,8 +134,9 @@ class MetaUtilsSuite extends AnyFunSuite {
       withResource(GpuPackedTableColumn.from(contigTable)) { uncompressedBatch =>
         val uncompressedMeta = MetaUtils.buildDegenerateTableMeta(uncompressedBatch)
         withResource(DeviceMemoryBuffer.allocate(0)) { buffer =>
-          val compressedTable = CompressedTable(0, uncompressedMeta, buffer)
-          withResource(GpuCompressedColumnVector.from(compressedTable)) { batch =>
+          val compressedTable = new CompressedTable(0, uncompressedMeta, buffer)
+          withResource(GpuCompressedColumnVector.from(
+              compressedTable.buffer, compressedTable.meta)) { batch =>
             val meta = MetaUtils.buildDegenerateTableMeta(batch)
             assertResult(null)(meta.bufferMeta)
             assertResult(0)(meta.rowCount)
diff --git a/tests/src/test/scala/com/nvidia/spark/rapids/WithRetrySuite.scala b/tests/src/test/scala/com/nvidia/spark/rapids/WithRetrySuite.scala
index 5346dbb3754..3bdb06086b3 100644
--- a/tests/src/test/scala/com/nvidia/spark/rapids/WithRetrySuite.scala
+++ b/tests/src/test/scala/com/nvidia/spark/rapids/WithRetrySuite.scala
@@ -250,7 +250,7 @@ class WithRetrySuite
     val numSplits = 2
     var doThrow = numSplits
     var lastSplitSize = 0L
-    val myTarget = AutoCloseableTargetSize(initialValue, minValue)
+    val myTarget = new AutoCloseableTargetSize(initialValue, minValue)
     try {
       withRetry(myTarget, splitTargetSizeInHalfGpu) { attempt =>
         lastSplitSize = attempt.targetSize
@@ -274,7 +274,7 @@ class WithRetrySuite
     val dataSize = 200L  // less than targetSize/2=500, so halving targetSize is a no-op
     var doThrow = true
     var splitTargetUsed = 0L
-    val myTarget = AutoCloseableTargetSize(targetSize, minSize, dataSize)
+    val myTarget = new AutoCloseableTargetSize(targetSize, minSize, dataSize)
     try {
       withRetry(myTarget, splitTargetSizeInHalfGpu) { attempt =>
         splitTargetUsed = attempt.targetSize
@@ -300,7 +300,7 @@ class WithRetrySuite
     val childDataSize = 2L  // actual bytes in the smaller child; less than targetSize/2=50
     var doThrow = true
     var splitTargetUsed = 0L
-    val myTarget = AutoCloseableTargetSize(targetSize, minSize, childDataSize)
+    val myTarget = new AutoCloseableTargetSize(targetSize, minSize, childDataSize)
     try {
       withRetry(myTarget, splitTargetSizeInHalfGpu) { attempt =>
         splitTargetUsed = attempt.targetSize
@@ -321,7 +321,7 @@ class WithRetrySuite
     val numSplits = 3
     var doThrow = numSplits
     var lastSplitSize = 0L
-    val myTarget = AutoCloseableTargetSize(initialValue, minValue)
+    val myTarget = new AutoCloseableTargetSize(initialValue, minValue)
     try {
       assertThrows[GpuSplitAndRetryOOM] {
         withRetry(myTarget, splitTargetSizeInHalfGpu) { attempt =>
diff --git a/tests/src/test/scala/com/nvidia/spark/rapids/shuffle/RapidsShuffleClientSuite.scala b/tests/src/test/scala/com/nvidia/spark/rapids/shuffle/RapidsShuffleClientSuite.scala
index 515ff75ffaa..2eb34347edf 100644
--- a/tests/src/test/scala/com/nvidia/spark/rapids/shuffle/RapidsShuffleClientSuite.scala
+++ b/tests/src/test/scala/com/nvidia/spark/rapids/shuffle/RapidsShuffleClientSuite.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2020-2024, NVIDIA CORPORATION.
+ * Copyright (c) 2020-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -33,7 +33,7 @@ class RapidsShuffleClientSuite extends RapidsShuffleTestHelper {
   def prepareBufferReceiveState(
       tableMeta: TableMeta,
       bounceBuffer: BounceBuffer): BufferReceiveState = {
-    val ptr = PendingTransferRequest(client, tableMeta, mockHandler)
+    val ptr = new PendingTransferRequest(client, tableMeta, mockHandler)
     spy(new BufferReceiveState(123L, bounceBuffer, Seq(ptr), () => {}))
   }
 
@@ -42,7 +42,7 @@ class RapidsShuffleClientSuite extends RapidsShuffleTestHelper {
       bounceBuffer: BounceBuffer): BufferReceiveState = {
 
     val ptrs = tableMetas.map { tm =>
-      PendingTransferRequest(client, tm, mockHandler)
+      new PendingTransferRequest(client, tm, mockHandler)
     }
 
     spy(new BufferReceiveState(123L, bounceBuffer, ptrs, () => {}))
diff --git a/tests/src/test/scala/com/nvidia/spark/rapids/shuffle/RapidsShuffleIteratorSuite.scala b/tests/src/test/scala/com/nvidia/spark/rapids/shuffle/RapidsShuffleIteratorSuite.scala
index af24b332c83..c9c67fb5185 100644
--- a/tests/src/test/scala/com/nvidia/spark/rapids/shuffle/RapidsShuffleIteratorSuite.scala
+++ b/tests/src/test/scala/com/nvidia/spark/rapids/shuffle/RapidsShuffleIteratorSuite.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2020-2024, NVIDIA CORPORATION.
+ * Copyright (c) 2020-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -172,7 +172,7 @@ class RapidsShuffleIteratorSuite extends RapidsShuffleTestHelper {
       val ac = ArgumentCaptor.forClass(classOf[RapidsShuffleFetchHandler])
       when(mockTransport.makeClient(any())).thenReturn(client)
       doNothing().when(client).doFetch(any(), ac.capture())
-      val mockBuffer = RapidsShuffleHandle(mock[SpillableDeviceBufferHandle], null)
+      val mockBuffer = new RapidsShuffleHandle(mock[SpillableDeviceBufferHandle], null)
       when(mockBuffer.spillable.sizeInBytes).thenReturn(123L)
 
       val cb = new ColumnarBatch(Array.empty, 10)
diff --git a/tests/src/test/scala/com/nvidia/spark/rapids/shuffle/RapidsShuffleServerSuite.scala b/tests/src/test/scala/com/nvidia/spark/rapids/shuffle/RapidsShuffleServerSuite.scala
index 8d7415fba04..9b0ca83b692 100644
--- a/tests/src/test/scala/com/nvidia/spark/rapids/shuffle/RapidsShuffleServerSuite.scala
+++ b/tests/src/test/scala/com/nvidia/spark/rapids/shuffle/RapidsShuffleServerSuite.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2020-2024, NVIDIA CORPORATION.
+ * Copyright (c) 2020-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -57,7 +57,7 @@ class RapidsShuffleServerSuite extends RapidsShuffleTestHelper {
         fillBuffer(hostBuff)
         deviceBuffer.copyFromHostBuffer(hostBuff)
         val mockMeta = RapidsShuffleTestHelper.mockTableMeta(100000)
-        RapidsShuffleHandle(SpillableDeviceBufferHandle(deviceBuffer), mockMeta)
+        new RapidsShuffleHandle(SpillableDeviceBufferHandle(deviceBuffer), mockMeta)
       }
     }
     new MockRapidsShuffleRequestHandler(mockBuffers)
@@ -208,7 +208,7 @@ class RapidsShuffleServerSuite extends RapidsShuffleTestHelper {
       withResource(new RefCountedDirectByteBuffer(bb)) { _ =>
         val tableMeta = MetaUtils.buildTableMeta(1, 456, bb, 100)
         val testHandle = SpillableDeviceBufferHandle(DeviceMemoryBuffer.allocate(456))
-        val rapidsBuffer = RapidsShuffleHandle(testHandle, tableMeta)
+        val rapidsBuffer = new RapidsShuffleHandle(testHandle, tableMeta)
         when(mockRequestHandler.getShuffleHandle(ArgumentMatchers.eq(1)))
           .thenReturn(rapidsBuffer)
 
@@ -277,8 +277,8 @@ class RapidsShuffleServerSuite extends RapidsShuffleTestHelper {
       val ex = new IllegalStateException("something happened")
       when(mockHandleThatThrows.materialize()).thenThrow(ex)
 
-      val rapidsBuffer = RapidsShuffleHandle(mockHandle, tableMeta)
-      val rapidsBufferThatThrows = RapidsShuffleHandle(mockHandleThatThrows, tableMeta)
+      val rapidsBuffer = new RapidsShuffleHandle(mockHandle, tableMeta)
+      val rapidsBufferThatThrows = new RapidsShuffleHandle(mockHandleThatThrows, tableMeta)
 
       when(mockRequestHandler.getShuffleHandle(ArgumentMatchers.eq(1)))
         .thenReturn(rapidsBuffer)
@@ -359,7 +359,7 @@ class RapidsShuffleServerSuite extends RapidsShuffleTestHelper {
         val tableMeta = MetaUtils.buildTableMeta(tableId, 456, bb, 100)
         val rapidsBuffer = if (error) {
           val mockHandle = mock[SpillableDeviceBufferHandle]
-          val rapidsBuffer = RapidsShuffleHandle(mockHandle, tableMeta)
+          val rapidsBuffer = new RapidsShuffleHandle(mockHandle, tableMeta)
           when(mockHandle.sizeInBytes).thenReturn(tableMeta.bufferMeta().size())
           // mock an error with the copy
           when(rapidsBuffer.spillable.materialize())
@@ -369,7 +369,7 @@ class RapidsShuffleServerSuite extends RapidsShuffleTestHelper {
           rapidsBuffer
         } else {
           val testHandle = spy(SpillableDeviceBufferHandle(spy(DeviceMemoryBuffer.allocate(456))))
-          RapidsShuffleHandle(testHandle, tableMeta)
+          new RapidsShuffleHandle(testHandle, tableMeta)
         }
         when(mockRequestHandler.getShuffleHandle(ArgumentMatchers.eq(tableId)))
           .thenAnswer(_ => rapidsBuffer)
diff --git a/tests/src/test/scala/com/nvidia/spark/rapids/shuffle/WindowedBlockIteratorSuite.scala b/tests/src/test/scala/com/nvidia/spark/rapids/shuffle/WindowedBlockIteratorSuite.scala
index 47d32633062..f24581451a2 100644
--- a/tests/src/test/scala/com/nvidia/spark/rapids/shuffle/WindowedBlockIteratorSuite.scala
+++ b/tests/src/test/scala/com/nvidia/spark/rapids/shuffle/WindowedBlockIteratorSuite.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2020-2021, NVIDIA CORPORATION.
+ * Copyright (c) 2020-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -28,10 +28,10 @@ class WindowedBlockIteratorSuite extends RapidsShuffleTestHelper {
   }
 
   test ("1-byte+ ranges are allowed, but 0-byte or negative ranges are not") {
-    assertResult(1)(BlockRange(null, 123, 124).rangeSize())
-    assertResult(2)(BlockRange(null, 123, 125).rangeSize())
-    assertThrows[IllegalArgumentException](BlockRange(null, 123, 123))
-    assertThrows[IllegalArgumentException](BlockRange(null, 123, 122))
+    assertResult(1)(new BlockRange[BlockWithSize](null, 123, 124).rangeSize())
+    assertResult(2)(new BlockRange[BlockWithSize](null, 123, 125).rangeSize())
+    assertThrows[IllegalArgumentException](new BlockRange[BlockWithSize](null, 123, 123))
+    assertThrows[IllegalArgumentException](new BlockRange[BlockWithSize](null, 123, 122))
   }
 
   test ("0-byte blocks are not allowed") {
diff --git a/tests/src/test/scala/com/nvidia/spark/rapids/spill/SpillUnitTestBase.scala b/tests/src/test/scala/com/nvidia/spark/rapids/spill/SpillUnitTestBase.scala
index 2e57f128fc6..7c2fdc2afb6 100644
--- a/tests/src/test/scala/com/nvidia/spark/rapids/spill/SpillUnitTestBase.scala
+++ b/tests/src/test/scala/com/nvidia/spark/rapids/spill/SpillUnitTestBase.scala
@@ -200,7 +200,7 @@ trait SpillUnitTestBase extends FunSuiteWithTempDir with MockitoSugar {
     withResource(codec.createBatchCompressor(0, Cuda.DEFAULT_STREAM)) { compressor =>
       compressor.addTableToCompress(buildContiguousTable(start, numRows))
       withResource(compressor.finish()) { compressed =>
-        GpuCompressedColumnVector.from(compressed.head)
+        GpuCompressedColumnVector.from(compressed.head.buffer, compressed.head.meta)
       }
     }
   }
diff --git a/tests/src/test/scala/com/nvidia/spark/rapids/unit/ComplexCreatorSizeEstimationTest.scala b/tests/src/test/scala/com/nvidia/spark/rapids/unit/ComplexCreatorSizeEstimationTest.scala
index bb6437fb6fb..dd9b1ae2737 100644
--- a/tests/src/test/scala/com/nvidia/spark/rapids/unit/ComplexCreatorSizeEstimationTest.scala
+++ b/tests/src/test/scala/com/nvidia/spark/rapids/unit/ComplexCreatorSizeEstimationTest.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2025, NVIDIA CORPORATION.
+ * Copyright (c) 2025-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -52,7 +52,7 @@ class ComplexCreatorSizeEstimationTest extends GpuUnitTests {
         GpuColumnVector.getTotalDeviceMemoryUsed(proCb)
       }
       val estimatedSize = PreProjectSplitIterator.calcMinOutputSize(inCb,
-        GpuTieredProject(Seq(boundList)))
+        new GpuTieredProject(Seq(boundList)))
       assertResult(actualSize)(estimatedSize)
     }
   }
diff --git a/tests/src/test/scala/com/nvidia/spark/rapids/window/GpuUnboundedToUnboundedAggWindowSuite.scala b/tests/src/test/scala/com/nvidia/spark/rapids/window/GpuUnboundedToUnboundedAggWindowSuite.scala
index fbdda7e2de9..8a61fe51169 100644
--- a/tests/src/test/scala/com/nvidia/spark/rapids/window/GpuUnboundedToUnboundedAggWindowSuite.scala
+++ b/tests/src/test/scala/com/nvidia/spark/rapids/window/GpuUnboundedToUnboundedAggWindowSuite.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2024-2025, NVIDIA CORPORATION.
+ * Copyright (c) 2024-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -40,7 +40,7 @@ class GpuUnboundedToUnboundedAggWindowSuite extends RmmSparkRetrySuiteBase {
     val finalProject = GpuUnboundedToUnboundedAggWindowIterator.computeFinalProject(
       rideAlongOutput, repeatOutput, repeatOutput ++ rideAlongOutput, Map.empty)
 
-    val conf = GpuUnboundedToUnboundedAggStages(Seq.empty, Seq.empty, Seq.empty,
+    val conf = new GpuUnboundedToUnboundedAggStages(Seq.empty, Seq.empty, Seq.empty,
                                                 Seq.empty, finalProject)
 
     def makeRepeatCb(): SpillableColumnarBatch = {
@@ -89,7 +89,7 @@ class GpuUnboundedToUnboundedAggWindowSuite extends RmmSparkRetrySuiteBase {
       rowsRemaining -= rowsToAdd
       rideAlongList.add(makeRideAlongCb(rowsToAdd.toInt))
     }
-    val inputIter = Seq(SecondPassAggResult(rideAlongList, makeRepeatCb())).toIterator
+    val inputIter = Seq(new SecondPassAggResult(rideAlongList, makeRepeatCb())).toIterator
     val splitIter = new GpuUnboundedToUnboundedAggSliceBySizeIterator(inputIter, conf,
       targetSizeBytes, NoopMetric)
     val repeatIter = new GpuUnboundedToUnboundedAggFinalIterator(splitIter, conf,
diff --git a/tests/src/test/scala/org/apache/spark/sql/rapids/GpuFileFormatDataWriterSuite.scala b/tests/src/test/scala/org/apache/spark/sql/rapids/GpuFileFormatDataWriterSuite.scala
index 4b39c53697f..a2dceda1420 100644
--- a/tests/src/test/scala/org/apache/spark/sql/rapids/GpuFileFormatDataWriterSuite.scala
+++ b/tests/src/test/scala/org/apache/spark/sql/rapids/GpuFileFormatDataWriterSuite.scala
@@ -156,7 +156,7 @@ class GpuFileFormatDataWriterSuite extends AnyFunSuite with BeforeAndAfterEach {
         dataSpec = allCols
       }
       if (numBuckets != 0) {
-        bucketSpec = Some(GpuWriterBucketSpec(
+        bucketSpec = Some(new GpuWriterBucketSpec(
           GpuPmod(GpuMurmur3Hash(Seq(allCols.last), 42), GpuLiteral(Math.abs(numBuckets))),
           _ => ""))
       }
diff --git a/tests/src/test/spark330/scala/com/nvidia/spark/rapids/shuffle/RapidsShuffleTestHelper.scala b/tests/src/test/spark330/scala/com/nvidia/spark/rapids/shuffle/RapidsShuffleTestHelper.scala
index 0e2f4aa1f74..14ef01fe928 100644
--- a/tests/src/test/spark330/scala/com/nvidia/spark/rapids/shuffle/RapidsShuffleTestHelper.scala
+++ b/tests/src/test/spark330/scala/com/nvidia/spark/rapids/shuffle/RapidsShuffleTestHelper.scala
@@ -117,7 +117,7 @@ abstract class RapidsShuffleTestHelper
 
   def getSendBounceBuffer(size: Long): SendBounceBuffers = {
     val db = DeviceMemoryBuffer.allocate(size)
-    SendBounceBuffers(new BounceBuffer(db) {
+    new SendBounceBuffers(new BounceBuffer(db) {
       override def free(bb: BounceBuffer): Unit = {
         db.close()
       }
diff --git a/tests/src/test/spark340/scala/com/nvidia/spark/rapids/shuffle/RapidsShuffleTestHelper.scala b/tests/src/test/spark340/scala/com/nvidia/spark/rapids/shuffle/RapidsShuffleTestHelper.scala
index 66c0f4925de..73ad14721c1 100644
--- a/tests/src/test/spark340/scala/com/nvidia/spark/rapids/shuffle/RapidsShuffleTestHelper.scala
+++ b/tests/src/test/spark340/scala/com/nvidia/spark/rapids/shuffle/RapidsShuffleTestHelper.scala
@@ -131,7 +131,7 @@ abstract class RapidsShuffleTestHelper
 
   def getSendBounceBuffer(size: Long): SendBounceBuffers = {
     val db = DeviceMemoryBuffer.allocate(size)
-    SendBounceBuffers(new BounceBuffer(db) {
+    new SendBounceBuffers(new BounceBuffer(db) {
       override def free(bb: BounceBuffer): Unit = {
         db.close()
       }
diff --git a/udf-compiler/src/main/scala-2.12/com/nvidia/spark/udf/Instruction.scala b/udf-compiler/src/main/scala-2.12/com/nvidia/spark/udf/Instruction.scala
index 7adaff26d99..8ce57b84f33 100644
--- a/udf-compiler/src/main/scala-2.12/com/nvidia/spark/udf/Instruction.scala
+++ b/udf-compiler/src/main/scala-2.12/com/nvidia/spark/udf/Instruction.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2019-2023, NVIDIA CORPORATION.
+ * Copyright (c) 2019-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -21,14 +21,13 @@ import java.nio.charset.Charset
 import com.nvidia.spark.rapids.shims.ShimExpression
 import com.nvidia.spark.udf.CatalystExpressionBuilder.simplify
 import javassist.bytecode.{CodeIterator, Opcode}
+import org.slf4j.LoggerFactory
 
 import org.apache.spark.SparkException
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.catalyst.analysis.TypeCoercion
 import org.apache.spark.sql.catalyst.expressions._
 import org.apache.spark.sql.types._
 
-
 private[udf] object Repr {
 
   abstract class CompilerInternal(name: String) extends ShimExpression {
@@ -154,7 +153,7 @@ private[udf] object Repr {
               if (elemType == t) {
                 Seq(args.head)
               } else {
-                Seq(Cast(args.head, t))
+                Seq(new Cast(args.head, t, None))
               }
             }
           }
@@ -216,7 +215,7 @@ private[udf] object Repr {
  * @param opcode
  * @param operand
  */
-case class Instruction(opcode: Int, operand: Int, instructionStr: String) extends Logging {
+case class Instruction(opcode: Int, operand: Int, instructionStr: String) {
   def makeState(lambdaReflection: LambdaReflection, basicBlock: BB, state: State): State = {
     val st = opcode match {
       case Opcode.ALOAD_0 | Opcode.DLOAD_0 | Opcode.FLOAD_0 |
@@ -321,7 +320,10 @@ case class Instruction(opcode: Int, operand: Int, instructionStr: String) extend
           })
       case _ => throw new SparkException("Unsupported instruction: " + instructionStr)
     }
-    logDebug(s"[Instruction] ${instructionStr} got new state: ${st} from state: ${state}")
+    if (Instruction.log.isDebugEnabled) {
+      Instruction.log.debug(
+        s"[Instruction] ${instructionStr} got new state: ${st} from state: ${state}")
+    }
     st
   }
 
@@ -441,7 +443,7 @@ case class Instruction(opcode: Int, operand: Int, instructionStr: String) extend
       state: State,
       dataType: DataType): State = {
     val State(locals, top :: rest, cond, expr) = state
-    State(locals, Cast(top, dataType) :: rest, cond, expr)
+    State(locals, new Cast(top, dataType, None) :: rest, cond, expr)
   }
 
   private def checkcast(lambdaReflection: LambdaReflection, state: State): State = {
@@ -774,13 +776,13 @@ case class Instruction(opcode: Int, operand: Int, instructionStr: String) extend
         EndsWith(args.head, args.last)
       case "equals" =>
         checkArgs(methodName, List(StringType, StringType), args)
-        Cast(EqualNullSafe(args.head, args.last), IntegerType)
+        new Cast(EqualNullSafe(args.head, args.last), IntegerType, None)
       case "equalsIgnoreCase" =>
         checkArgs(methodName, List(StringType, StringType), args)
-        Cast(EqualNullSafe(Upper(args.head), Upper(args.last)), IntegerType)
+        new Cast(EqualNullSafe(Upper(args.head), Upper(args.last)), IntegerType, None)
       case "isEmpty" =>
         checkArgs(methodName, List(StringType), args)
-        Cast(EqualTo(Length(args.head), Literal(0)), IntegerType)
+        new Cast(EqualTo(Length(args.head), Literal(0)), IntegerType, None)
       case "length" =>
         checkArgs(methodName, List(StringType), args)
         Length(args.head)
@@ -836,7 +838,7 @@ case class Instruction(opcode: Int, operand: Int, instructionStr: String) extend
               s"String.${methodName}: " +
               s"${args.head.dataType}")
         }
-        Cast(args.head, StringType)
+        new Cast(args.head, StringType, None)
       case "indexOf" =>
         if (args.length == 2) {
           if (args(1).dataType == StringType) {
@@ -884,10 +886,10 @@ case class Instruction(opcode: Int, operand: Int, instructionStr: String) extend
       case "getBytes" =>
         if (args.length == 1) {
           checkArgs(methodName, List(StringType), args)
-          Encode(args.head, Literal(Charset.defaultCharset.toString))
+          new Encode(args.head, Literal(Charset.defaultCharset.toString))
         } else if (args.length == 2) {
           checkArgs(methodName, List(StringType, StringType), args)
-          Encode(args.head, args.last)
+          new Encode(args.head, args.last)
         } else {
           throw new SparkException(
             s"String.${methodName} operation expects 1 or 2 argument(s), " +
@@ -953,6 +955,8 @@ case class Instruction(opcode: Int, operand: Int, instructionStr: String) extend
  * Ultimately, every opcode will have to be covered here.
  */
 object Instruction {
+  private val log = LoggerFactory.getLogger(classOf[Instruction])
+
   def apply(codeIterator: CodeIterator, offset: Int, instructionStr: String): Instruction = {
     val opcode: Int = codeIterator.byteAt(offset)
     val operand: Int = opcode match {
diff --git a/udf-compiler/src/main/scala-2.13/com/nvidia/spark/udf/Instruction.scala b/udf-compiler/src/main/scala-2.13/com/nvidia/spark/udf/Instruction.scala
index 36fe79da384..fbfe59b6bf7 100644
--- a/udf-compiler/src/main/scala-2.13/com/nvidia/spark/udf/Instruction.scala
+++ b/udf-compiler/src/main/scala-2.13/com/nvidia/spark/udf/Instruction.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2019-2023, NVIDIA CORPORATION.
+ * Copyright (c) 2019-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -21,14 +21,13 @@ import java.nio.charset.Charset
 import com.nvidia.spark.rapids.shims.ShimExpression
 import com.nvidia.spark.udf.CatalystExpressionBuilder.simplify
 import javassist.bytecode.{CodeIterator, Opcode}
+import org.slf4j.LoggerFactory
 
 import org.apache.spark.SparkException
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.catalyst.analysis.TypeCoercion
 import org.apache.spark.sql.catalyst.expressions._
 import org.apache.spark.sql.types._
 
-
 private[udf] object Repr {
 
   abstract class CompilerInternal(name: String) extends ShimExpression {
@@ -149,7 +148,7 @@ private[udf] object Repr {
               if (elemType == t) {
                 Seq(args.head)
               } else {
-                Seq(Cast(args.head, t))
+                Seq(new Cast(args.head, t, None))
               }
             }
           }
@@ -211,7 +210,7 @@ private[udf] object Repr {
  * @param opcode
  * @param operand
  */
-case class Instruction(opcode: Int, operand: Int, instructionStr: String) extends Logging {
+case class Instruction(opcode: Int, operand: Int, instructionStr: String) {
   def makeState(lambdaReflection: LambdaReflection, basicBlock: BB, state: State): State = {
     val st = opcode match {
       case Opcode.ALOAD_0 | Opcode.DLOAD_0 | Opcode.FLOAD_0 |
@@ -322,7 +321,10 @@ case class Instruction(opcode: Int, operand: Int, instructionStr: String) extend
         })
       case _ => throw new SparkException("Unsupported instruction: " + instructionStr)
     }
-    logDebug(s"[Instruction] ${instructionStr} got new state: ${st} from state: ${state}")
+    if (Instruction.log.isDebugEnabled) {
+      Instruction.log.debug(
+        s"[Instruction] ${instructionStr} got new state: ${st} from state: ${state}")
+    }
     st
   }
 
@@ -442,7 +444,7 @@ case class Instruction(opcode: Int, operand: Int, instructionStr: String) extend
       state: State,
       dataType: DataType): State = {
     val State(locals, top :: rest, cond, expr) = state
-    State(locals, Cast(top, dataType) :: rest, cond, expr)
+    State(locals, new Cast(top, dataType, None) :: rest, cond, expr)
   }
 
   private def checkcast(lambdaReflection: LambdaReflection, state: State): State = {
@@ -800,13 +802,13 @@ case class Instruction(opcode: Int, operand: Int, instructionStr: String) extend
         EndsWith(args.head, args.last)
       case "equals" =>
         checkArgs(methodName, List(StringType, StringType), args)
-        Cast(EqualNullSafe(args.head, args.last), IntegerType)
+        new Cast(EqualNullSafe(args.head, args.last), IntegerType, None)
       case "equalsIgnoreCase" =>
         checkArgs(methodName, List(StringType, StringType), args)
-        Cast(EqualNullSafe(Upper(args.head), Upper(args.last)), IntegerType)
+        new Cast(EqualNullSafe(Upper(args.head), Upper(args.last)), IntegerType, None)
       case "isEmpty" =>
         checkArgs(methodName, List(StringType), args)
-        Cast(EqualTo(Length(args.head), Literal(0)), IntegerType)
+        new Cast(EqualTo(Length(args.head), Literal(0)), IntegerType, None)
       case "length" =>
         checkArgs(methodName, List(StringType), args)
         Length(args.head)
@@ -862,7 +864,7 @@ case class Instruction(opcode: Int, operand: Int, instructionStr: String) extend
               s"String.${methodName}: " +
               s"${args.head.dataType}")
         }
-        Cast(args.head, StringType)
+        new Cast(args.head, StringType, None)
       case "indexOf" =>
         if (args.length == 2) {
           if (args(1).dataType == StringType) {
@@ -910,10 +912,10 @@ case class Instruction(opcode: Int, operand: Int, instructionStr: String) extend
       case "getBytes" =>
         if (args.length == 1) {
           checkArgs(methodName, List(StringType), args)
-          Encode(args.head, Literal(Charset.defaultCharset.toString))
+          new Encode(args.head, Literal(Charset.defaultCharset.toString))
         } else if (args.length == 2) {
           checkArgs(methodName, List(StringType, StringType), args)
-          Encode(args.head, args.last)
+          new Encode(args.head, args.last)
         } else {
           throw new SparkException(
             s"String.${methodName} operation expects 1 or 2 argument(s), " +
@@ -979,6 +981,8 @@ case class Instruction(opcode: Int, operand: Int, instructionStr: String) extend
  * Ultimately, every opcode will have to be covered here.
  */
 object Instruction {
+  private val log = LoggerFactory.getLogger(classOf[Instruction])
+
   def apply(codeIterator: CodeIterator, offset: Int, instructionStr: String): Instruction = {
     val opcode: Int = codeIterator.byteAt(offset)
     val operand: Int = opcode match {
diff --git a/udf-compiler/src/main/scala/com/nvidia/spark/udf/CFG.scala b/udf-compiler/src/main/scala/com/nvidia/spark/udf/CFG.scala
index 34472e890e0..1aa76958675 100644
--- a/udf-compiler/src/main/scala/com/nvidia/spark/udf/CFG.scala
+++ b/udf-compiler/src/main/scala/com/nvidia/spark/udf/CFG.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2019-2024, NVIDIA CORPORATION.
+ * Copyright (c) 2019-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -22,9 +22,9 @@ import scala.collection.immutable.{HashMap, SortedMap, SortedSet}
 import CatalystExpressionBuilder.simplify
 import javassist.bytecode.{CodeIterator, ConstPool, InstructionPrinter, Opcode}
 import javassist.bytecode.analysis.Util
+import org.slf4j.LoggerFactory
 
 import org.apache.spark.SparkException
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.catalyst.expressions._
 
 /**
@@ -43,7 +43,7 @@ import org.apache.spark.sql.catalyst.expressions._
  *
  * @param instructionTable
  */
-case class BB(instructionTable: SortedMap[Int, Instruction]) extends Logging {
+case class BB(instructionTable: SortedMap[Int, Instruction]) {
   def offset: Int = instructionTable.head._1
 
   def last: (Int, Instruction) = instructionTable.last
@@ -54,18 +54,24 @@ case class BB(instructionTable: SortedMap[Int, Instruction]) extends Logging {
 
   def propagateState(cfg: CFG, states: Map[BB, State]): Map[BB, State] = {
     val state@State(_, _, cond, expr) = states(this)
-    logDebug(s"[BB.propagateState] propagating condition: ${cond} from state ${state} " +
-        s"onto states: ${states}")
+    if (BB.log.isDebugEnabled) {
+      BB.log.debug(s"[BB.propagateState] propagating condition: ${cond} from state ${state} " +
+          s"onto states: ${states}")
+    }
     lastInstruction.opcode match {
       case Opcode.IF_ICMPEQ | Opcode.IF_ICMPNE | Opcode.IF_ICMPLT |
            Opcode.IF_ICMPGE | Opcode.IF_ICMPGT | Opcode.IF_ICMPLE |
            Opcode.IFLT | Opcode.IFLE | Opcode.IFGT | Opcode.IFGE |
            Opcode.IFEQ | Opcode.IFNE | Opcode.IFNULL | Opcode.IFNONNULL => {
-        logTrace(s"[BB.propagateState] lastInstruction: ${lastInstruction.instructionStr}")
+        if (BB.log.isTraceEnabled) {
+          BB.log.trace(s"[BB.propagateState] lastInstruction: ${lastInstruction.instructionStr}")
+        }
 
         // An if statement has both a false and a true successor
         val (0, falseSucc) :: (1, trueSucc) :: Nil = cfg.successor(this)
-        logTrace(s"[BB.propagateState] falseSucc ${falseSucc} trueSuccc ${trueSucc}")
+        if (BB.log.isTraceEnabled) { // guard: skip building the message when TRACE is off
+          BB.log.trace(s"[BB.propagateState] falseSucc ${falseSucc} trueSucc ${trueSucc}")
+        }
 
         // cond is the entry condition into the condition block, and expr is the
         // actual condition for IF* (see Instruction.ifOp).
@@ -80,7 +86,9 @@ case class BB(instructionTable: SortedMap[Int, Instruction]) extends Logging {
         val falseState = state.copy(cond = simplify(And(cond, Not(expr.get))))
         val trueState = state.copy(cond = simplify(And(cond, expr.get)))
 
-        logDebug(s"[BB.propagateState] States before: ${states}")
+        if (BB.log.isDebugEnabled) {
+          BB.log.debug(s"[BB.propagateState] States before: ${states}")
+        }
 
         // Each successor may already have the state populated if it has
         // multiple predecessors.
@@ -88,7 +96,9 @@ case class BB(instructionTable: SortedMap[Int, Instruction]) extends Logging {
         val newStates = (states
             + (falseSucc -> falseState.merge(states.get(falseSucc)))
             + (trueSucc -> trueState.merge(states.get(trueSucc))))
-        logDebug(s"[BB.propagateState] States after: ${newStates}")
+        if (BB.log.isDebugEnabled) {
+          BB.log.debug(s"[BB.propagateState] States after: ${newStates}")
+        }
         newStates
       }
       case Opcode.TABLESWITCH | Opcode.LOOKUPSWITCH =>
@@ -120,6 +130,10 @@ case class BB(instructionTable: SortedMap[Int, Instruction]) extends Logging {
   }
 }
 
+object BB { // companion object: holds the logger used by BB.propagateState
+  private val log = LoggerFactory.getLogger(classOf[BB]) // SLF4J logger for the BB class
+}
+
 /**
  * The Control Flow Graph object.
  *
diff --git a/udf-compiler/src/main/scala/com/nvidia/spark/udf/CatalystExpressionBuilder.scala b/udf-compiler/src/main/scala/com/nvidia/spark/udf/CatalystExpressionBuilder.scala
index 2628b17457f..919a63b59d9 100644
--- a/udf-compiler/src/main/scala/com/nvidia/spark/udf/CatalystExpressionBuilder.scala
+++ b/udf-compiler/src/main/scala/com/nvidia/spark/udf/CatalystExpressionBuilder.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2019-2023, NVIDIA CORPORATION.
+ * Copyright (c) 2019-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -19,9 +19,9 @@ package com.nvidia.spark.udf
 import scala.annotation.tailrec
 
 import javassist.CtClass
+import org.slf4j.LoggerFactory
 
 import org.apache.spark.SparkException
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.catalyst.expressions._
 import org.apache.spark.sql.types._
 
@@ -42,7 +42,7 @@ import org.apache.spark.sql.types._
  *
  * @param function the original Scala UDF provided by the user
  */
-case class CatalystExpressionBuilder(private val function: AnyRef) extends Logging {
+case class CatalystExpressionBuilder(private val function: AnyRef) {
   final private val lambdaReflection: LambdaReflection = LambdaReflection(function)
 
   final private val cfg = CFG(lambdaReflection)
@@ -72,23 +72,28 @@ case class CatalystExpressionBuilder(private val function: AnyRef) extends Loggi
     // pick first of the Basic Blocks, and start recursing
     val entryBlock = cfg.basicBlocks.head
 
-    logDebug(s"[CatalystExpressionBuilder] Attempting to compile: ${function}, " +
-        s"with children: ${children}, " + s"entry block: ${entryBlock}, and " +
-        s"entry state: ${entryState}")
+    if (CatalystExpressionBuilder.log.isDebugEnabled) {
+      CatalystExpressionBuilder.log.debug(
+        s"[CatalystExpressionBuilder] Attempting to compile: ${function}, " +
+            s"with children: ${children}, " + s"entry block: ${entryBlock}, and " +
+            s"entry state: ${entryState}")
+    }
 
     // start recursing
     val compiled = doCompile(List(entryBlock), Map(entryBlock -> entryState)).map { e =>
       if (lambdaReflection.ret == CtClass.booleanType) {
         // JVM bytecode returns an integer value when the return type is
         // boolean, hence the cast.
-        CatalystExpressionBuilder.simplify(Cast(e, BooleanType))
+        CatalystExpressionBuilder.simplify(new Cast(e, BooleanType, None))
       } else {
         e
       }
     }
 
     if (compiled.isEmpty) {
-      logDebug(s"[CatalystExpressionBuilder] failed to compile")
+      if (CatalystExpressionBuilder.log.isDebugEnabled) {
+        CatalystExpressionBuilder.log.debug(s"[CatalystExpressionBuilder] failed to compile")
+      }
     } else {
       val expr = compiled.get
       val internal = expr.find(_.isInstanceOf[Repr.CompilerInternal])
@@ -96,7 +101,10 @@ case class CatalystExpressionBuilder(private val function: AnyRef) extends Loggi
         throw new IllegalStateException(
           s"compiled UDF has compiler internal expression $e: $expr")
       }
-      logDebug(s"[CatalystExpressionBuilder] compiled expression: $expr")
+      if (CatalystExpressionBuilder.log.isDebugEnabled) {
+        CatalystExpressionBuilder.log.debug(
+          s"[CatalystExpressionBuilder] compiled expression: $expr")
+      }
     }
 
     compiled
@@ -156,7 +164,9 @@ case class CatalystExpressionBuilder(private val function: AnyRef) extends Loggi
     // find the state associated with this BB
     val state: State = states(basicBlock)
 
-    logTrace(s"States for basic block ${basicBlock} => ${state}")
+    if (CatalystExpressionBuilder.log.isTraceEnabled) {
+      CatalystExpressionBuilder.log.trace(s"States for basic block ${basicBlock} => ${state}")
+    }
 
     /**
      * Iterate through the instruction table for the BB:
@@ -274,7 +284,9 @@ case class CatalystExpressionBuilder(private val function: AnyRef) extends Loggi
  * simplify a directly translated catalyst expression (from bytecode) into something simpler
  * that the remaining catalyst optimizations can handle.
  */
-object CatalystExpressionBuilder extends Logging {
+object CatalystExpressionBuilder {
+  private val log = LoggerFactory.getLogger(classOf[CatalystExpressionBuilder])
+
   /** simplify: given a raw converted catalyst expression, attempt to match patterns to simplify
    * before handing it over to catalyst optimizers (the LogicalPlan does this later).
    *
@@ -473,8 +485,8 @@ object CatalystExpressionBuilder extends Logging {
           ce.child match {
             case If(c, t, f) =>
           simplifyExpr(If(simplifyExpr(c),
-            simplifyExpr(Cast(t, BooleanType, ce.timeZoneId)),
-            simplifyExpr(Cast(f, BooleanType, ce.timeZoneId))))
+            simplifyExpr(new Cast(t, BooleanType, ce.timeZoneId)),
+            simplifyExpr(new Cast(f, BooleanType, ce.timeZoneId))))
           }
         case If(c, Repr.ArrayBuffer(t), Repr.ArrayBuffer(f)) => Repr.ArrayBuffer(If(c, t, f))
         case If(c, Repr.StringBuilder(t), Repr.StringBuilder(f)) => Repr.StringBuilder(If(c, t, f))
@@ -483,7 +495,10 @@ object CatalystExpressionBuilder extends Logging {
         case If(c, t, f) => If(simplifyExpr(c), simplifyExpr(t), simplifyExpr(f))
         case _ => expr
       }
-      logDebug(s"[CatalystExpressionBuilder] simplify: ${expr} ==> ${res}")
+      if (CatalystExpressionBuilder.log.isDebugEnabled) {
+        CatalystExpressionBuilder.log.debug(
+          s"[CatalystExpressionBuilder] simplify: ${expr} ==> ${res}")
+      }
       res
     }
 
diff --git a/udf-compiler/src/main/scala/com/nvidia/spark/udf/GpuScalaUDF.scala b/udf-compiler/src/main/scala/com/nvidia/spark/udf/GpuScalaUDF.scala
index bee2f73a3bf..7ef6ccff0e4 100644
--- a/udf-compiler/src/main/scala/com/nvidia/spark/udf/GpuScalaUDF.scala
+++ b/udf-compiler/src/main/scala/com/nvidia/spark/udf/GpuScalaUDF.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2019-2022, NVIDIA CORPORATION.
+ * Copyright (c) 2019-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -19,15 +19,15 @@ package com.nvidia.spark.udf
 import scala.util.control.NonFatal
 
 import com.nvidia.spark.rapids.shims.ShimExpression
+import org.slf4j.LoggerFactory
 
 import org.apache.spark.SparkException
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.catalyst.InternalRow
 import org.apache.spark.sql.catalyst.expressions.{Expression, ScalaUDF}
 import org.apache.spark.sql.catalyst.expressions.codegen.{CodegenContext, ExprCode}
 import org.apache.spark.sql.types.DataType
 
-case class GpuScalaUDFLogical(udf: ScalaUDF) extends ShimExpression with Logging {
+case class GpuScalaUDFLogical(udf: ScalaUDF) extends ShimExpression {
   override def nullable: Boolean = udf.nullable
 
   override def eval(input: InternalRow): Any = {
@@ -53,15 +53,21 @@ case class GpuScalaUDFLogical(udf: ScalaUDF) extends ShimExpression with Logging
     } catch {
       case e: SparkException =>
         val udfName = udf.udfName.getOrElse("<unknown>")
-        logDebug(s"UDF $udfName compilation failure: $e")
+        if (GpuScalaUDFLogical.log.isDebugEnabled) {
+          GpuScalaUDFLogical.log.debug(s"UDF $udfName compilation failure: $e")
+        }
         if (isTestEnabled) {
           throw e
         }
         udf
       case NonFatal(e) =>
         val udfName = udf.udfName.getOrElse("<unknown>")
-        logWarning(s"Unable to translate UDF $udfName: $e")
+        GpuScalaUDFLogical.log.warn(s"Unable to translate UDF $udfName: $e")
         udf
     }
   }
 }
+
+object GpuScalaUDFLogical { // companion object: SLF4J logger for UDF translation failures
+  private val log = LoggerFactory.getLogger(classOf[GpuScalaUDFLogical])
+}
diff --git a/udf-compiler/src/main/scala/com/nvidia/spark/udf/LogicalPlanRules.scala b/udf-compiler/src/main/scala/com/nvidia/spark/udf/LogicalPlanRules.scala
index e9732e064c7..41373b330cf 100644
--- a/udf-compiler/src/main/scala/com/nvidia/spark/udf/LogicalPlanRules.scala
+++ b/udf-compiler/src/main/scala/com/nvidia/spark/udf/LogicalPlanRules.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2021, NVIDIA CORPORATION.
+ * Copyright (c) 2021-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -19,14 +19,13 @@ package com.nvidia.spark.udf
 import ai.rapids.cudf.{NvtxColor, NvtxRange}
 import com.nvidia.spark.rapids.RapidsConf
 
-import org.apache.spark.internal.Logging
 import org.apache.spark.sql.catalyst.expressions.{Expression, NamedExpression, ScalaUDF}
 import org.apache.spark.sql.catalyst.plans.logical.{LogicalPlan, Project}
 import org.apache.spark.sql.catalyst.rules.Rule
 import org.apache.spark.sql.rapids.GpuScalaUDF.getRapidsUDFInstance
 
 
-case class LogicalPlanRules() extends Rule[LogicalPlan] with Logging {
+class LogicalPlanRules extends Rule[LogicalPlan] {
   def replacePartialFunc(plan: LogicalPlan): PartialFunction[Expression, Expression] = {
     case d: Expression => {
       val nvtx = new NvtxRange("replace UDF", NvtxColor.BLUE)
diff --git a/udf-compiler/src/main/scala/com/nvidia/spark/udf/State.scala b/udf-compiler/src/main/scala/com/nvidia/spark/udf/State.scala
index 114469ba019..7d4c76b5365 100644
--- a/udf-compiler/src/main/scala/com/nvidia/spark/udf/State.scala
+++ b/udf-compiler/src/main/scala/com/nvidia/spark/udf/State.scala
@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2019-2020, NVIDIA CORPORATION.
+ * Copyright (c) 2019-2026, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -89,8 +89,8 @@ case class State(locals: IndexedSeq[Expression],
           val commonType = TypeCoercion.findTightestCommonType(l1.dataType, l2.dataType)
           commonType.fold(throw new SparkException(s"Conditional type check failure")){
             t => simplify(If(cond,
-                             if (t == l1.dataType) l1 else Cast(l1, t),
-                             if (t == l2.dataType) l2 else Cast(l2, t)))
+                             if (t == l1.dataType) l1 else new Cast(l1, t, None),
+                             if (t == l2.dataType) l2 else new Cast(l2, t, None)))
           }
       }
       // At the end of the compliation, the expression at the top of stack is