From d8476ebfa0356f23d1f552969b5c94b34684bd2b Mon Sep 17 00:00:00 2001
From: Chang chen <changchen@microsoft.com>
Date: Tue, 24 Mar 2026 05:56:04 +0000
Subject: [PATCH 01/12] [GLUTEN-11550][UT] Fix GlutenSQLExecutionSuite

Inject GlutenPlugin via System.setProperty so per-test SparkSessions
created by the parent suite load it. Use GlutenTestsCommonTrait to
avoid creating a persistent session that conflicts with per-test
SparkContext creation.

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
---
 .../utils/velox/VeloxTestSettings.scala       |  2 +-
 .../execution/GlutenSQLExecutionSuite.scala   | 25 +++++++++++++++++--
 .../utils/velox/VeloxTestSettings.scala       |  2 +-
 .../execution/GlutenSQLExecutionSuite.scala   | 25 +++++++++++++++++--
 4 files changed, 48 insertions(+), 6 deletions(-)

diff --git a/gluten-ut/spark40/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala b/gluten-ut/spark40/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
index d0716932b756..026710ef85fa 100644
--- a/gluten-ut/spark40/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
+++ b/gluten-ut/spark40/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
@@ -715,7 +715,7 @@ class VeloxTestSettings extends BackendTestSettings {
   // TODO: 4.x enableSuite[GlutenRemoveRedundantProjectsSuite]  // 14 failures
   // TODO: 4.x enableSuite[GlutenRemoveRedundantSortsSuite]  // 1 failure
   enableSuite[GlutenRowToColumnConverterSuite]
-  // TODO: 4.x enableSuite[GlutenSQLExecutionSuite]  // 1 failure
+  enableSuite[GlutenSQLExecutionSuite]
   enableSuite[GlutenSQLFunctionSuite]
   // TODO: 4.x enableSuite[GlutenSQLJsonProtocolSuite]  // 1 failure
   // TODO: 4.x enableSuite[GlutenShufflePartitionsUtilSuite]  // 1 failure
diff --git a/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/execution/GlutenSQLExecutionSuite.scala b/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/execution/GlutenSQLExecutionSuite.scala
index 51c06b3b6900..d7df069d4447 100644
--- a/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/execution/GlutenSQLExecutionSuite.scala
+++ b/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/execution/GlutenSQLExecutionSuite.scala
@@ -16,6 +16,27 @@
  */
 package org.apache.spark.sql.execution
 
-import org.apache.spark.sql.GlutenTestsTrait
+import org.apache.spark.sql.GlutenTestsCommonTrait
 
-class GlutenSQLExecutionSuite extends SQLExecutionSuite with GlutenTestsTrait {}
+class GlutenSQLExecutionSuite extends SQLExecutionSuite with GlutenTestsCommonTrait {
+
+  override def beforeAll(): Unit = {
+    // Inject GlutenPlugin so per-test SparkSessions created by the parent suite load it.
+    // SparkConf reads system properties prefixed with "spark." as defaults.
+    System.setProperty("spark.plugins", "org.apache.gluten.GlutenPlugin")
+    System.setProperty("spark.memory.offHeap.enabled", "true")
+    System.setProperty("spark.memory.offHeap.size", "1024MB")
+    System.setProperty(
+      "spark.shuffle.manager",
+      "org.apache.spark.shuffle.sort.ColumnarShuffleManager")
+    super.beforeAll()
+  }
+
+  override def afterAll(): Unit = {
+    super.afterAll()
+    System.clearProperty("spark.plugins")
+    System.clearProperty("spark.memory.offHeap.enabled")
+    System.clearProperty("spark.memory.offHeap.size")
+    System.clearProperty("spark.shuffle.manager")
+  }
+}
diff --git a/gluten-ut/spark41/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala b/gluten-ut/spark41/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
index 47a1ff3d66e7..033d1abb0eb4 100644
--- a/gluten-ut/spark41/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
+++ b/gluten-ut/spark41/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
@@ -685,7 +685,7 @@ class VeloxTestSettings extends BackendTestSettings {
   // TODO: 4.x enableSuite[GlutenRemoveRedundantProjectsSuite]  // 14 failures
   // TODO: 4.x enableSuite[GlutenRemoveRedundantSortsSuite]  // 1 failure
   enableSuite[GlutenRowToColumnConverterSuite]
-  // TODO: 4.x enableSuite[GlutenSQLExecutionSuite]  // 1 failure
+  enableSuite[GlutenSQLExecutionSuite]
   enableSuite[GlutenSQLFunctionSuite]
   // TODO: 4.x enableSuite[GlutenSQLJsonProtocolSuite]  // 1 failure
   // TODO: 4.x enableSuite[GlutenShufflePartitionsUtilSuite]  // 1 failure
diff --git a/gluten-ut/spark41/src/test/scala/org/apache/spark/sql/execution/GlutenSQLExecutionSuite.scala b/gluten-ut/spark41/src/test/scala/org/apache/spark/sql/execution/GlutenSQLExecutionSuite.scala
index 27865af762ec..d7df069d4447 100644
--- a/gluten-ut/spark41/src/test/scala/org/apache/spark/sql/execution/GlutenSQLExecutionSuite.scala
+++ b/gluten-ut/spark41/src/test/scala/org/apache/spark/sql/execution/GlutenSQLExecutionSuite.scala
@@ -16,6 +16,27 @@
  */
 package org.apache.spark.sql.execution
 
-import org.apache.spark.sql.shim.GlutenTestsTrait
+import org.apache.spark.sql.GlutenTestsCommonTrait
 
-class GlutenSQLExecutionSuite extends SQLExecutionSuite with GlutenTestsTrait {}
+class GlutenSQLExecutionSuite extends SQLExecutionSuite with GlutenTestsCommonTrait {
+
+  override def beforeAll(): Unit = {
+    // Inject GlutenPlugin so per-test SparkSessions created by the parent suite load it.
+    // SparkConf reads system properties prefixed with "spark." as defaults.
+    System.setProperty("spark.plugins", "org.apache.gluten.GlutenPlugin")
+    System.setProperty("spark.memory.offHeap.enabled", "true")
+    System.setProperty("spark.memory.offHeap.size", "1024MB")
+    System.setProperty(
+      "spark.shuffle.manager",
+      "org.apache.spark.shuffle.sort.ColumnarShuffleManager")
+    super.beforeAll()
+  }
+
+  override def afterAll(): Unit = {
+    super.afterAll()
+    System.clearProperty("spark.plugins")
+    System.clearProperty("spark.memory.offHeap.enabled")
+    System.clearProperty("spark.memory.offHeap.size")
+    System.clearProperty("spark.shuffle.manager")
+  }
+}

From 5ff4f5b6586f0edc5ae0f62511faad7ad6b65cac Mon Sep 17 00:00:00 2001
From: Chang chen <changchen@microsoft.com>
Date: Tue, 24 Mar 2026 06:03:00 +0000
Subject: [PATCH 02/12] [GLUTEN-11550][UT] Fix GlutenSQLJsonProtocolSuite,
 GlutenShufflePartitionsUtilSuite, GlutenExternalAppendOnlyUnsafeRowArraySuite

Same pattern as GlutenSQLExecutionSuite: these suites create per-test
SparkContexts which conflict with GlutenTestsTrait's persistent session.
Switch to GlutenTestsCommonTrait + inject GlutenPlugin via System.setProperty
so each test's SparkSession loads it.

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
---
 .../utils/velox/VeloxTestSettings.scala       |  6 ++---
 ...xternalAppendOnlyUnsafeRowArraySuite.scala | 23 +++++++++++++++--
 .../GlutenSQLJsonProtocolSuite.scala          | 23 +++++++++++++++--
 .../GlutenShufflePartitionsUtilSuite.scala    | 25 +++++++++++++++++--
 .../utils/velox/VeloxTestSettings.scala       |  6 ++---
 ...xternalAppendOnlyUnsafeRowArraySuite.scala | 23 +++++++++++++++--
 .../GlutenSQLJsonProtocolSuite.scala          | 23 +++++++++++++++--
 .../GlutenShufflePartitionsUtilSuite.scala    | 25 +++++++++++++++++--
 8 files changed, 136 insertions(+), 18 deletions(-)

diff --git a/gluten-ut/spark40/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala b/gluten-ut/spark40/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
index 026710ef85fa..f94e51e2325b 100644
--- a/gluten-ut/spark40/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
+++ b/gluten-ut/spark40/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
@@ -699,7 +699,7 @@ class VeloxTestSettings extends BackendTestSettings {
   // TODO: 4.x enableSuite[GlutenDataSourceScanExecRedactionSuite]  // 2 failures
   // TODO: 4.x enableSuite[GlutenDataSourceV2ScanExecRedactionSuite]  // 2 failures
   enableSuite[GlutenExecuteImmediateEndToEndSuite]
-  // TODO: 4.x enableSuite[GlutenExternalAppendOnlyUnsafeRowArraySuite]  // 14 failures
+  enableSuite[GlutenExternalAppendOnlyUnsafeRowArraySuite]
   enableSuite[GlutenGlobalTempViewSuite]
   enableSuite[GlutenGlobalTempViewTestSuite]
   enableSuite[GlutenGroupedIteratorSuite]
@@ -717,8 +717,8 @@ class VeloxTestSettings extends BackendTestSettings {
   enableSuite[GlutenRowToColumnConverterSuite]
   enableSuite[GlutenSQLExecutionSuite]
   enableSuite[GlutenSQLFunctionSuite]
-  // TODO: 4.x enableSuite[GlutenSQLJsonProtocolSuite]  // 1 failure
-  // TODO: 4.x enableSuite[GlutenShufflePartitionsUtilSuite]  // 1 failure
+  enableSuite[GlutenSQLJsonProtocolSuite]
+  enableSuite[GlutenShufflePartitionsUtilSuite]
   // TODO: 4.x enableSuite[GlutenSimpleSQLViewSuite]  // 1 failure
   // TODO: 4.x enableSuite[GlutenSparkPlanSuite]  // 1 failure
   enableSuite[GlutenSparkPlannerSuite]
diff --git a/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/execution/GlutenExternalAppendOnlyUnsafeRowArraySuite.scala b/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/execution/GlutenExternalAppendOnlyUnsafeRowArraySuite.scala
index f947c4f406aa..cd64b5e55e1f 100644
--- a/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/execution/GlutenExternalAppendOnlyUnsafeRowArraySuite.scala
+++ b/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/execution/GlutenExternalAppendOnlyUnsafeRowArraySuite.scala
@@ -16,8 +16,27 @@
  */
 package org.apache.spark.sql.execution
 
-import org.apache.spark.sql.GlutenTestsTrait
+import org.apache.spark.sql.GlutenTestsCommonTrait
 
 class GlutenExternalAppendOnlyUnsafeRowArraySuite
   extends ExternalAppendOnlyUnsafeRowArraySuite
-  with GlutenTestsTrait {}
+  with GlutenTestsCommonTrait {
+
+  override def beforeAll(): Unit = {
+    System.setProperty("spark.plugins", "org.apache.gluten.GlutenPlugin")
+    System.setProperty("spark.memory.offHeap.enabled", "true")
+    System.setProperty("spark.memory.offHeap.size", "1024MB")
+    System.setProperty(
+      "spark.shuffle.manager",
+      "org.apache.spark.shuffle.sort.ColumnarShuffleManager")
+    super.beforeAll()
+  }
+
+  override def afterAll(): Unit = {
+    super.afterAll()
+    System.clearProperty("spark.plugins")
+    System.clearProperty("spark.memory.offHeap.enabled")
+    System.clearProperty("spark.memory.offHeap.size")
+    System.clearProperty("spark.shuffle.manager")
+  }
+}
diff --git a/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/execution/GlutenSQLJsonProtocolSuite.scala b/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/execution/GlutenSQLJsonProtocolSuite.scala
index 7ce28aae8917..f868ebfd2998 100644
--- a/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/execution/GlutenSQLJsonProtocolSuite.scala
+++ b/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/execution/GlutenSQLJsonProtocolSuite.scala
@@ -16,6 +16,25 @@
  */
 package org.apache.spark.sql.execution
 
-import org.apache.spark.sql.GlutenTestsTrait
+import org.apache.spark.sql.GlutenTestsCommonTrait
 
-class GlutenSQLJsonProtocolSuite extends SQLJsonProtocolSuite with GlutenTestsTrait {}
+class GlutenSQLJsonProtocolSuite extends SQLJsonProtocolSuite with GlutenTestsCommonTrait {
+
+  override def beforeAll(): Unit = {
+    System.setProperty("spark.plugins", "org.apache.gluten.GlutenPlugin")
+    System.setProperty("spark.memory.offHeap.enabled", "true")
+    System.setProperty("spark.memory.offHeap.size", "1024MB")
+    System.setProperty(
+      "spark.shuffle.manager",
+      "org.apache.spark.shuffle.sort.ColumnarShuffleManager")
+    super.beforeAll()
+  }
+
+  override def afterAll(): Unit = {
+    super.afterAll()
+    System.clearProperty("spark.plugins")
+    System.clearProperty("spark.memory.offHeap.enabled")
+    System.clearProperty("spark.memory.offHeap.size")
+    System.clearProperty("spark.shuffle.manager")
+  }
+}
diff --git a/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/execution/GlutenShufflePartitionsUtilSuite.scala b/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/execution/GlutenShufflePartitionsUtilSuite.scala
index 866d6cea5423..f56e0cc3b8ef 100644
--- a/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/execution/GlutenShufflePartitionsUtilSuite.scala
+++ b/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/execution/GlutenShufflePartitionsUtilSuite.scala
@@ -16,6 +16,27 @@
  */
 package org.apache.spark.sql.execution
 
-import org.apache.spark.sql.GlutenTestsTrait
+import org.apache.spark.sql.GlutenTestsCommonTrait
 
-class GlutenShufflePartitionsUtilSuite extends ShufflePartitionsUtilSuite with GlutenTestsTrait {}
+class GlutenShufflePartitionsUtilSuite
+  extends ShufflePartitionsUtilSuite
+  with GlutenTestsCommonTrait {
+
+  override def beforeAll(): Unit = {
+    System.setProperty("spark.plugins", "org.apache.gluten.GlutenPlugin")
+    System.setProperty("spark.memory.offHeap.enabled", "true")
+    System.setProperty("spark.memory.offHeap.size", "1024MB")
+    System.setProperty(
+      "spark.shuffle.manager",
+      "org.apache.spark.shuffle.sort.ColumnarShuffleManager")
+    super.beforeAll()
+  }
+
+  override def afterAll(): Unit = {
+    super.afterAll()
+    System.clearProperty("spark.plugins")
+    System.clearProperty("spark.memory.offHeap.enabled")
+    System.clearProperty("spark.memory.offHeap.size")
+    System.clearProperty("spark.shuffle.manager")
+  }
+}
diff --git a/gluten-ut/spark41/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala b/gluten-ut/spark41/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
index 033d1abb0eb4..1ffccf3e9852 100644
--- a/gluten-ut/spark41/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
+++ b/gluten-ut/spark41/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
@@ -669,7 +669,7 @@ class VeloxTestSettings extends BackendTestSettings {
   // TODO: 4.x enableSuite[GlutenDataSourceScanExecRedactionSuite]  // 2 failures
   // TODO: 4.x enableSuite[GlutenDataSourceV2ScanExecRedactionSuite]  // 2 failures
   enableSuite[GlutenExecuteImmediateEndToEndSuite]
-  // TODO: 4.x enableSuite[GlutenExternalAppendOnlyUnsafeRowArraySuite]  // 14 failures
+  enableSuite[GlutenExternalAppendOnlyUnsafeRowArraySuite]
   enableSuite[GlutenGlobalTempViewSuite]
   enableSuite[GlutenGlobalTempViewTestSuite]
   enableSuite[GlutenGroupedIteratorSuite]
@@ -687,8 +687,8 @@ class VeloxTestSettings extends BackendTestSettings {
   enableSuite[GlutenRowToColumnConverterSuite]
   enableSuite[GlutenSQLExecutionSuite]
   enableSuite[GlutenSQLFunctionSuite]
-  // TODO: 4.x enableSuite[GlutenSQLJsonProtocolSuite]  // 1 failure
-  // TODO: 4.x enableSuite[GlutenShufflePartitionsUtilSuite]  // 1 failure
+  enableSuite[GlutenSQLJsonProtocolSuite]
+  enableSuite[GlutenShufflePartitionsUtilSuite]
   // TODO: 4.x enableSuite[GlutenSimpleSQLViewSuite]  // 2 failures
   // TODO: 4.x enableSuite[GlutenSparkPlanSuite]  // 1 failure
   enableSuite[GlutenSparkPlannerSuite]
diff --git a/gluten-ut/spark41/src/test/scala/org/apache/spark/sql/execution/GlutenExternalAppendOnlyUnsafeRowArraySuite.scala b/gluten-ut/spark41/src/test/scala/org/apache/spark/sql/execution/GlutenExternalAppendOnlyUnsafeRowArraySuite.scala
index cd3aeb6438de..cd64b5e55e1f 100644
--- a/gluten-ut/spark41/src/test/scala/org/apache/spark/sql/execution/GlutenExternalAppendOnlyUnsafeRowArraySuite.scala
+++ b/gluten-ut/spark41/src/test/scala/org/apache/spark/sql/execution/GlutenExternalAppendOnlyUnsafeRowArraySuite.scala
@@ -16,8 +16,27 @@
  */
 package org.apache.spark.sql.execution
 
-import org.apache.spark.sql.shim.GlutenTestsTrait
+import org.apache.spark.sql.GlutenTestsCommonTrait
 
 class GlutenExternalAppendOnlyUnsafeRowArraySuite
   extends ExternalAppendOnlyUnsafeRowArraySuite
-  with GlutenTestsTrait {}
+  with GlutenTestsCommonTrait {
+
+  override def beforeAll(): Unit = {
+    System.setProperty("spark.plugins", "org.apache.gluten.GlutenPlugin")
+    System.setProperty("spark.memory.offHeap.enabled", "true")
+    System.setProperty("spark.memory.offHeap.size", "1024MB")
+    System.setProperty(
+      "spark.shuffle.manager",
+      "org.apache.spark.shuffle.sort.ColumnarShuffleManager")
+    super.beforeAll()
+  }
+
+  override def afterAll(): Unit = {
+    super.afterAll()
+    System.clearProperty("spark.plugins")
+    System.clearProperty("spark.memory.offHeap.enabled")
+    System.clearProperty("spark.memory.offHeap.size")
+    System.clearProperty("spark.shuffle.manager")
+  }
+}
diff --git a/gluten-ut/spark41/src/test/scala/org/apache/spark/sql/execution/GlutenSQLJsonProtocolSuite.scala b/gluten-ut/spark41/src/test/scala/org/apache/spark/sql/execution/GlutenSQLJsonProtocolSuite.scala
index 2ca7b4380d65..f868ebfd2998 100644
--- a/gluten-ut/spark41/src/test/scala/org/apache/spark/sql/execution/GlutenSQLJsonProtocolSuite.scala
+++ b/gluten-ut/spark41/src/test/scala/org/apache/spark/sql/execution/GlutenSQLJsonProtocolSuite.scala
@@ -16,6 +16,25 @@
  */
 package org.apache.spark.sql.execution
 
-import org.apache.spark.sql.shim.GlutenTestsTrait
+import org.apache.spark.sql.GlutenTestsCommonTrait
 
-class GlutenSQLJsonProtocolSuite extends SQLJsonProtocolSuite with GlutenTestsTrait {}
+class GlutenSQLJsonProtocolSuite extends SQLJsonProtocolSuite with GlutenTestsCommonTrait {
+
+  override def beforeAll(): Unit = {
+    System.setProperty("spark.plugins", "org.apache.gluten.GlutenPlugin")
+    System.setProperty("spark.memory.offHeap.enabled", "true")
+    System.setProperty("spark.memory.offHeap.size", "1024MB")
+    System.setProperty(
+      "spark.shuffle.manager",
+      "org.apache.spark.shuffle.sort.ColumnarShuffleManager")
+    super.beforeAll()
+  }
+
+  override def afterAll(): Unit = {
+    super.afterAll()
+    System.clearProperty("spark.plugins")
+    System.clearProperty("spark.memory.offHeap.enabled")
+    System.clearProperty("spark.memory.offHeap.size")
+    System.clearProperty("spark.shuffle.manager")
+  }
+}
diff --git a/gluten-ut/spark41/src/test/scala/org/apache/spark/sql/execution/GlutenShufflePartitionsUtilSuite.scala b/gluten-ut/spark41/src/test/scala/org/apache/spark/sql/execution/GlutenShufflePartitionsUtilSuite.scala
index 5a6595bd9eb3..f56e0cc3b8ef 100644
--- a/gluten-ut/spark41/src/test/scala/org/apache/spark/sql/execution/GlutenShufflePartitionsUtilSuite.scala
+++ b/gluten-ut/spark41/src/test/scala/org/apache/spark/sql/execution/GlutenShufflePartitionsUtilSuite.scala
@@ -16,6 +16,27 @@
  */
 package org.apache.spark.sql.execution
 
-import org.apache.spark.sql.shim.GlutenTestsTrait
+import org.apache.spark.sql.GlutenTestsCommonTrait
 
-class GlutenShufflePartitionsUtilSuite extends ShufflePartitionsUtilSuite with GlutenTestsTrait {}
+class GlutenShufflePartitionsUtilSuite
+  extends ShufflePartitionsUtilSuite
+  with GlutenTestsCommonTrait {
+
+  override def beforeAll(): Unit = {
+    System.setProperty("spark.plugins", "org.apache.gluten.GlutenPlugin")
+    System.setProperty("spark.memory.offHeap.enabled", "true")
+    System.setProperty("spark.memory.offHeap.size", "1024MB")
+    System.setProperty(
+      "spark.shuffle.manager",
+      "org.apache.spark.shuffle.sort.ColumnarShuffleManager")
+    super.beforeAll()
+  }
+
+  override def afterAll(): Unit = {
+    super.afterAll()
+    System.clearProperty("spark.plugins")
+    System.clearProperty("spark.memory.offHeap.enabled")
+    System.clearProperty("spark.memory.offHeap.size")
+    System.clearProperty("spark.shuffle.manager")
+  }
+}

From a4f74ab74affa78fa091e8bc13cb2cc5a9fe29f3 Mon Sep 17 00:00:00 2001
From: Chang chen <changchen@microsoft.com>
Date: Tue, 24 Mar 2026 06:22:07 +0000
Subject: [PATCH 03/12] [GLUTEN-11550][UT] Fix GlutenCsvExpressionsSuite

Override 'unsupported mode' test: Gluten's DataFrame-based checkEvaluation
throws AnalysisException directly instead of wrapping it in
TestFailedException. The overridden test intercepts AnalysisException.

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
---
 .../utils/velox/VeloxTestSettings.scala       |  3 ++-
 .../GlutenCsvExpressionsSuite.scala           | 25 +++++++++++++++++--
 .../utils/velox/VeloxTestSettings.scala       |  3 ++-
 .../GlutenCsvExpressionsSuite.scala           | 23 ++++++++++++++++-
 4 files changed, 49 insertions(+), 5 deletions(-)

diff --git a/gluten-ut/spark40/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala b/gluten-ut/spark40/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
index f94e51e2325b..68c4997e70f4 100644
--- a/gluten-ut/spark40/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
+++ b/gluten-ut/spark40/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
@@ -222,7 +222,8 @@ class VeloxTestSettings extends BackendTestSettings {
   enableSuite[GlutenCodeGeneratorWithInterpretedFallbackSuite]
   enableSuite[GlutenCollationExpressionSuite]
   enableSuite[GlutenCollationRegexpExpressionsSuite]
-  // TODO: 4.x enableSuite[GlutenCsvExpressionsSuite]  // failures with GlutenPlugin
+  enableSuite[GlutenCsvExpressionsSuite]
+    .exclude("unsupported mode")
   enableSuite[GlutenDynamicPruningSubquerySuite]
   enableSuite[GlutenExprIdSuite]
   // TODO: 4.x enableSuite[GlutenExpressionEvalHelperSuite]  // 2 failures
diff --git a/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/catalyst/expressions/GlutenCsvExpressionsSuite.scala b/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/catalyst/expressions/GlutenCsvExpressionsSuite.scala
index 02c0dd69dfd7..19e3724823b2 100644
--- a/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/catalyst/expressions/GlutenCsvExpressionsSuite.scala
+++ b/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/catalyst/expressions/GlutenCsvExpressionsSuite.scala
@@ -16,6 +16,27 @@
  */
 package org.apache.spark.sql.catalyst.expressions
 
-import org.apache.spark.sql.GlutenTestsTrait
+import org.apache.spark.sql.AnalysisException
+import org.apache.spark.sql.catalyst.InternalRow
+import org.apache.spark.sql.catalyst.util.DateTimeTestUtils.UTC_OPT
+import org.apache.spark.sql.shim.GlutenTestsTrait
+import org.apache.spark.sql.types.{DoubleType, StructField, StructType}
 
-class GlutenCsvExpressionsSuite extends CsvExpressionsSuite with GlutenTestsTrait {}
+class GlutenCsvExpressionsSuite extends CsvExpressionsSuite with GlutenTestsTrait {
+
+  // Gluten's checkEvaluation (DataFrame-based) throws AnalysisException directly,
+  // not wrapped in TestFailedException as the codegen/interpreted path does.
+  testGluten("unsupported mode - gluten") {
+    val csvData = "---"
+    val schema = StructType(StructField("a", DoubleType) :: Nil)
+    checkError(
+      exception = intercept[AnalysisException] {
+        checkEvaluation(
+          CsvToStructs(schema, Map("mode" -> "DROPMALFORMED"), Literal(csvData), UTC_OPT),
+          InternalRow(null))
+      },
+      condition = "PARSE_MODE_UNSUPPORTED",
+      parameters = Map("funcName" -> "`from_csv`", "mode" -> "DROPMALFORMED")
+    )
+  }
+}
diff --git a/gluten-ut/spark41/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala b/gluten-ut/spark41/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
index 1ffccf3e9852..674668157141 100644
--- a/gluten-ut/spark41/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
+++ b/gluten-ut/spark41/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
@@ -233,7 +233,8 @@ class VeloxTestSettings extends BackendTestSettings {
   enableSuite[GlutenCodeGeneratorWithInterpretedFallbackSuite]
   enableSuite[GlutenCollationExpressionSuite]
   // TODO: 4.x enableSuite[GlutenCollationRegexpExpressionsSuite]  // 1 failure
-  // TODO: 4.x enableSuite[GlutenCsvExpressionsSuite]  // failures with GlutenPlugin
+  enableSuite[GlutenCsvExpressionsSuite]
+    .exclude("unsupported mode")
   enableSuite[GlutenDynamicPruningSubquerySuite]
   enableSuite[GlutenExprIdSuite]
   // TODO: 4.x enableSuite[GlutenExpressionEvalHelperSuite]  // 2 failures
diff --git a/gluten-ut/spark41/src/test/scala/org/apache/spark/sql/catalyst/expressions/GlutenCsvExpressionsSuite.scala b/gluten-ut/spark41/src/test/scala/org/apache/spark/sql/catalyst/expressions/GlutenCsvExpressionsSuite.scala
index 90d2575c9d6e..19e3724823b2 100644
--- a/gluten-ut/spark41/src/test/scala/org/apache/spark/sql/catalyst/expressions/GlutenCsvExpressionsSuite.scala
+++ b/gluten-ut/spark41/src/test/scala/org/apache/spark/sql/catalyst/expressions/GlutenCsvExpressionsSuite.scala
@@ -16,6 +16,27 @@
  */
 package org.apache.spark.sql.catalyst.expressions
 
+import org.apache.spark.sql.AnalysisException
+import org.apache.spark.sql.catalyst.InternalRow
+import org.apache.spark.sql.catalyst.util.DateTimeTestUtils.UTC_OPT
 import org.apache.spark.sql.shim.GlutenTestsTrait
+import org.apache.spark.sql.types.{DoubleType, StructField, StructType}
 
-class GlutenCsvExpressionsSuite extends CsvExpressionsSuite with GlutenTestsTrait {}
+class GlutenCsvExpressionsSuite extends CsvExpressionsSuite with GlutenTestsTrait {
+
+  // Gluten's checkEvaluation (DataFrame-based) throws AnalysisException directly,
+  // not wrapped in TestFailedException as the codegen/interpreted path does.
+  testGluten("unsupported mode - gluten") {
+    val csvData = "---"
+    val schema = StructType(StructField("a", DoubleType) :: Nil)
+    checkError(
+      exception = intercept[AnalysisException] {
+        checkEvaluation(
+          CsvToStructs(schema, Map("mode" -> "DROPMALFORMED"), Literal(csvData), UTC_OPT),
+          InternalRow(null))
+      },
+      condition = "PARSE_MODE_UNSUPPORTED",
+      parameters = Map("funcName" -> "`from_csv`", "mode" -> "DROPMALFORMED")
+    )
+  }
+}

From 2a2f55aac514cf64d15f650429f118cdcabb3ee9 Mon Sep 17 00:00:00 2001
From: Chang chen <changchen@microsoft.com>
Date: Tue, 24 Mar 2026 06:26:30 +0000
Subject: [PATCH 04/12] [GLUTEN-11550][UT] Fix GlutenUnsafeRowSerializerSuite

Use System.setProperty to inject GlutenPlugin into per-test SparkSessions
created by parent suite (LocalSparkSession pattern).

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
---
 .../utils/velox/VeloxTestSettings.scala       |  2 +-
 .../GlutenUnsafeRowSerializerSuite.scala      | 23 +++++++++++++++++--
 .../utils/velox/VeloxTestSettings.scala       |  2 +-
 .../GlutenUnsafeRowSerializerSuite.scala      | 23 +++++++++++++++++--
 4 files changed, 44 insertions(+), 6 deletions(-)

diff --git a/gluten-ut/spark40/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala b/gluten-ut/spark40/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
index 68c4997e70f4..b0fd6586ed2a 100644
--- a/gluten-ut/spark40/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
+++ b/gluten-ut/spark40/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
@@ -727,7 +727,7 @@ class VeloxTestSettings extends BackendTestSettings {
   enableSuite[GlutenSparkSqlParserSuite]
   enableSuite[GlutenUnsafeFixedWidthAggregationMapSuite]
   enableSuite[GlutenUnsafeKVExternalSorterSuite]
-  // TODO: 4.x enableSuite[GlutenUnsafeRowSerializerSuite]  // 1 failure
+  enableSuite[GlutenUnsafeRowSerializerSuite]
   // TODO: 4.x enableSuite[GlutenWholeStageCodegenSparkSubmitSuite]  // 1 failure
   // TODO: 4.x enableSuite[GlutenWholeStageCodegenSuite]  // 24 failures
   enableSuite[GlutenBroadcastExchangeSuite]
diff --git a/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/execution/GlutenUnsafeRowSerializerSuite.scala b/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/execution/GlutenUnsafeRowSerializerSuite.scala
index 39a52a35dda6..2ec6ca1a9fc7 100644
--- a/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/execution/GlutenUnsafeRowSerializerSuite.scala
+++ b/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/execution/GlutenUnsafeRowSerializerSuite.scala
@@ -16,6 +16,25 @@
  */
 package org.apache.spark.sql.execution
 
-import org.apache.spark.sql.GlutenTestsTrait
+import org.apache.spark.sql.GlutenTestsCommonTrait
 
-class GlutenUnsafeRowSerializerSuite extends UnsafeRowSerializerSuite with GlutenTestsTrait {}
+class GlutenUnsafeRowSerializerSuite extends UnsafeRowSerializerSuite with GlutenTestsCommonTrait {
+
+  override def beforeAll(): Unit = {
+    System.setProperty("spark.plugins", "org.apache.gluten.GlutenPlugin")
+    System.setProperty("spark.memory.offHeap.enabled", "true")
+    System.setProperty("spark.memory.offHeap.size", "1024MB")
+    System.setProperty(
+      "spark.shuffle.manager",
+      "org.apache.spark.shuffle.sort.ColumnarShuffleManager")
+    super.beforeAll()
+  }
+
+  override def afterAll(): Unit = {
+    super.afterAll()
+    System.clearProperty("spark.plugins")
+    System.clearProperty("spark.memory.offHeap.enabled")
+    System.clearProperty("spark.memory.offHeap.size")
+    System.clearProperty("spark.shuffle.manager")
+  }
+}
diff --git a/gluten-ut/spark41/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala b/gluten-ut/spark41/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
index 674668157141..f095cda483cd 100644
--- a/gluten-ut/spark41/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
+++ b/gluten-ut/spark41/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
@@ -697,7 +697,7 @@ class VeloxTestSettings extends BackendTestSettings {
   enableSuite[GlutenSparkSqlParserSuite]
   enableSuite[GlutenUnsafeFixedWidthAggregationMapSuite]
   enableSuite[GlutenUnsafeKVExternalSorterSuite]
-  // TODO: 4.x enableSuite[GlutenUnsafeRowSerializerSuite]  // 1 failure
+  enableSuite[GlutenUnsafeRowSerializerSuite]
   // TODO: 4.x enableSuite[GlutenWholeStageCodegenSparkSubmitSuite]  // 1 failure
   // TODO: 4.x enableSuite[GlutenWholeStageCodegenSuite]  // 24 failures
   enableSuite[GlutenBroadcastExchangeSuite]
diff --git a/gluten-ut/spark41/src/test/scala/org/apache/spark/sql/execution/GlutenUnsafeRowSerializerSuite.scala b/gluten-ut/spark41/src/test/scala/org/apache/spark/sql/execution/GlutenUnsafeRowSerializerSuite.scala
index d81f8d58e7b3..2ec6ca1a9fc7 100644
--- a/gluten-ut/spark41/src/test/scala/org/apache/spark/sql/execution/GlutenUnsafeRowSerializerSuite.scala
+++ b/gluten-ut/spark41/src/test/scala/org/apache/spark/sql/execution/GlutenUnsafeRowSerializerSuite.scala
@@ -16,6 +16,25 @@
  */
 package org.apache.spark.sql.execution
 
-import org.apache.spark.sql.shim.GlutenTestsTrait
+import org.apache.spark.sql.GlutenTestsCommonTrait
 
-class GlutenUnsafeRowSerializerSuite extends UnsafeRowSerializerSuite with GlutenTestsTrait {}
+class GlutenUnsafeRowSerializerSuite extends UnsafeRowSerializerSuite with GlutenTestsCommonTrait {
+
+  override def beforeAll(): Unit = {
+    System.setProperty("spark.plugins", "org.apache.gluten.GlutenPlugin")
+    System.setProperty("spark.memory.offHeap.enabled", "true")
+    System.setProperty("spark.memory.offHeap.size", "1024MB")
+    System.setProperty(
+      "spark.shuffle.manager",
+      "org.apache.spark.shuffle.sort.ColumnarShuffleManager")
+    super.beforeAll()
+  }
+
+  override def afterAll(): Unit = {
+    super.afterAll()
+    System.clearProperty("spark.plugins")
+    System.clearProperty("spark.memory.offHeap.enabled")
+    System.clearProperty("spark.memory.offHeap.size")
+    System.clearProperty("spark.shuffle.manager")
+  }
+}

From e3a9cfedab0d090fcbd0f4e02b20cd7a410739e4 Mon Sep 17 00:00:00 2001
From: Chang chen <changchen@microsoft.com>
Date: Tue, 24 Mar 2026 06:37:12 +0000
Subject: [PATCH 05/12] [GLUTEN-11550][UT] Fix GlutenSparkPlanSuite

Override SPARK-37779 test to find VeloxColumnarToRowExec (extends
ColumnarToRowExecBase) instead of ColumnarToRowExec.

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
---
 .../utils/velox/VeloxTestSettings.scala       |  7 ++--
 .../sql/execution/GlutenSparkPlanSuite.scala  | 33 ++++++++++++++++++-
 .../utils/velox/VeloxTestSettings.scala       |  7 ++--
 .../sql/execution/GlutenSparkPlanSuite.scala  | 33 ++++++++++++++++++-
 4 files changed, 72 insertions(+), 8 deletions(-)

diff --git a/gluten-ut/spark40/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala b/gluten-ut/spark40/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
index b0fd6586ed2a..d7333ea83a9c 100644
--- a/gluten-ut/spark40/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
+++ b/gluten-ut/spark40/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
@@ -721,15 +721,16 @@ class VeloxTestSettings extends BackendTestSettings {
   enableSuite[GlutenSQLJsonProtocolSuite]
   enableSuite[GlutenShufflePartitionsUtilSuite]
   // TODO: 4.x enableSuite[GlutenSimpleSQLViewSuite]  // 1 failure
-  // TODO: 4.x enableSuite[GlutenSparkPlanSuite]  // 1 failure
+  enableSuite[GlutenSparkPlanSuite]
+    .exclude("SPARK-37779: ColumnarToRowExec should be canonicalizable after being (de)serialized")
   enableSuite[GlutenSparkPlannerSuite]
   enableSuite[GlutenSparkScriptTransformationSuite]
   enableSuite[GlutenSparkSqlParserSuite]
   enableSuite[GlutenUnsafeFixedWidthAggregationMapSuite]
   enableSuite[GlutenUnsafeKVExternalSorterSuite]
   enableSuite[GlutenUnsafeRowSerializerSuite]
-  // TODO: 4.x enableSuite[GlutenWholeStageCodegenSparkSubmitSuite]  // 1 failure
-  // TODO: 4.x enableSuite[GlutenWholeStageCodegenSuite]  // 24 failures
+  // TODO: 4.x enableSuite[GlutenWholeStageCodegenSparkSubmitSuite]  // depends on codegen path
+  // TODO: 4.x enableSuite[GlutenWholeStageCodegenSuite]  // 24 failures: all test WholeStageCodegen which Gluten bypasses
   enableSuite[GlutenBroadcastExchangeSuite]
   enableSuite[GlutenLocalBroadcastExchangeSuite]
   enableSuite[GlutenCoalesceShufflePartitionsSuite]
diff --git a/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/execution/GlutenSparkPlanSuite.scala b/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/execution/GlutenSparkPlanSuite.scala
index a3f0a577d782..3549004e56c9 100644
--- a/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/execution/GlutenSparkPlanSuite.scala
+++ b/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/execution/GlutenSparkPlanSuite.scala
@@ -16,6 +16,37 @@
  */
 package org.apache.spark.sql.execution
 
+import org.apache.gluten.execution.{ColumnarToRowExecBase => GlutenC2R}
+
 import org.apache.spark.sql.GlutenSQLTestsTrait
+import org.apache.spark.sql.internal.SQLConf
+
+class GlutenSparkPlanSuite extends SparkPlanSuite with GlutenSQLTestsTrait {
 
-class GlutenSparkPlanSuite extends SparkPlanSuite with GlutenSQLTestsTrait {}
+  testGluten(
+    "SPARK-37779: ColumnarToRowExec should be canonicalizable after being (de)serialized") {
+    withSQLConf(SQLConf.USE_V1_SOURCE_LIST.key -> "parquet") {
+      withTempPath {
+        path =>
+          spark.range(1).write.parquet(path.getAbsolutePath)
+          val df = spark.read.parquet(path.getAbsolutePath)
+          // Gluten replaces ColumnarToRowExec with VeloxColumnarToRowExec
+          val c2r = df.queryExecution.executedPlan
+            .collectFirst { case p: GlutenC2R => p }
+            .orElse(df.queryExecution.executedPlan
+              .collectFirst { case p: ColumnarToRowExec => p })
+            .get
+          try {
+            spark.range(1).foreach {
+              _ =>
+                c2r.canonicalized
+                ()
+            }
+          } catch {
+            case e: Throwable =>
+              fail("ColumnarToRow was not canonicalizable", e)
+          }
+      }
+    }
+  }
+}
diff --git a/gluten-ut/spark41/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala b/gluten-ut/spark41/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
index f095cda483cd..11fbad7f6069 100644
--- a/gluten-ut/spark41/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
+++ b/gluten-ut/spark41/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
@@ -691,15 +691,16 @@ class VeloxTestSettings extends BackendTestSettings {
   enableSuite[GlutenSQLJsonProtocolSuite]
   enableSuite[GlutenShufflePartitionsUtilSuite]
   // TODO: 4.x enableSuite[GlutenSimpleSQLViewSuite]  // 2 failures
-  // TODO: 4.x enableSuite[GlutenSparkPlanSuite]  // 1 failure
+  enableSuite[GlutenSparkPlanSuite]
+    .exclude("SPARK-37779: ColumnarToRowExec should be canonicalizable after being (de)serialized")
   enableSuite[GlutenSparkPlannerSuite]
   enableSuite[GlutenSparkScriptTransformationSuite]
   enableSuite[GlutenSparkSqlParserSuite]
   enableSuite[GlutenUnsafeFixedWidthAggregationMapSuite]
   enableSuite[GlutenUnsafeKVExternalSorterSuite]
   enableSuite[GlutenUnsafeRowSerializerSuite]
-  // TODO: 4.x enableSuite[GlutenWholeStageCodegenSparkSubmitSuite]  // 1 failure
-  // TODO: 4.x enableSuite[GlutenWholeStageCodegenSuite]  // 24 failures
+  // TODO: 4.x enableSuite[GlutenWholeStageCodegenSparkSubmitSuite]  // depends on codegen path
+  // TODO: 4.x enableSuite[GlutenWholeStageCodegenSuite]  // 24 failures: all test WholeStageCodegen which Gluten bypasses
   enableSuite[GlutenBroadcastExchangeSuite]
     .exclude("SPARK-52962: broadcast exchange should not reset metrics") // Add Gluten test
   enableSuite[GlutenLocalBroadcastExchangeSuite]
diff --git a/gluten-ut/spark41/src/test/scala/org/apache/spark/sql/execution/GlutenSparkPlanSuite.scala b/gluten-ut/spark41/src/test/scala/org/apache/spark/sql/execution/GlutenSparkPlanSuite.scala
index a3f0a577d782..3549004e56c9 100644
--- a/gluten-ut/spark41/src/test/scala/org/apache/spark/sql/execution/GlutenSparkPlanSuite.scala
+++ b/gluten-ut/spark41/src/test/scala/org/apache/spark/sql/execution/GlutenSparkPlanSuite.scala
@@ -16,6 +16,37 @@
  */
 package org.apache.spark.sql.execution
 
+import org.apache.gluten.execution.{ColumnarToRowExecBase => GlutenC2R}
+
 import org.apache.spark.sql.GlutenSQLTestsTrait
+import org.apache.spark.sql.internal.SQLConf
+
+class GlutenSparkPlanSuite extends SparkPlanSuite with GlutenSQLTestsTrait {
 
-class GlutenSparkPlanSuite extends SparkPlanSuite with GlutenSQLTestsTrait {}
+  testGluten(
+    "SPARK-37779: ColumnarToRowExec should be canonicalizable after being (de)serialized") {
+    withSQLConf(SQLConf.USE_V1_SOURCE_LIST.key -> "parquet") {
+      withTempPath {
+        path =>
+          spark.range(1).write.parquet(path.getAbsolutePath)
+          val df = spark.read.parquet(path.getAbsolutePath)
+          // Gluten replaces ColumnarToRowExec with VeloxColumnarToRowExec
+          val c2r = df.queryExecution.executedPlan
+            .collectFirst { case p: GlutenC2R => p }
+            .orElse(df.queryExecution.executedPlan
+              .collectFirst { case p: ColumnarToRowExec => p })
+            .get
+          try {
+            spark.range(1).foreach {
+              _ =>
+                c2r.canonicalized
+                ()
+            }
+          } catch {
+            case e: Throwable =>
+              fail("ColumnarToRow was not canonicalizable", e)
+          }
+      }
+    }
+  }
+}

From 91e745790819e2cb44c697afd47fe9920308ffc9 Mon Sep 17 00:00:00 2001
From: Chang chen <changchen@microsoft.com>
Date: Tue, 24 Mar 2026 06:41:11 +0000
Subject: [PATCH 06/12] [GLUTEN-11550][UT] Fix GlutenGroupBasedUpdateTableSuite
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Enable suite with .exclude for 'update with NOT NULL checks' — Velox
throws VeloxUserError wrapped as SparkException instead of the expected
SparkRuntimeException. Root cause: Velox native NOT NULL check uses
different exception chain than Spark's AssertNotNull expression.

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
---
 .../org/apache/gluten/utils/velox/VeloxTestSettings.scala      | 3 ++-
 .../org/apache/gluten/utils/velox/VeloxTestSettings.scala      | 3 ++-
 2 files changed, 4 insertions(+), 2 deletions(-)

diff --git a/gluten-ut/spark40/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala b/gluten-ut/spark40/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
index d7333ea83a9c..f0b0d697b80d 100644
--- a/gluten-ut/spark40/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
+++ b/gluten-ut/spark40/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
@@ -254,7 +254,8 @@ class VeloxTestSettings extends BackendTestSettings {
   enableSuite[GlutenDataSourceV2MetricsSuite]
   enableSuite[GlutenDataSourceV2OptionSuite]
   enableSuite[GlutenDataSourceV2UtilsSuite]
-  // TODO: 4.x enableSuite[GlutenGroupBasedUpdateTableSuite]  // 1 failure
+  enableSuite[GlutenGroupBasedUpdateTableSuite]
+    .exclude("update with NOT NULL checks")
   enableSuite[GlutenMergeIntoDataFrameSuite]
   enableSuite[GlutenProcedureSuite]
   enableSuite[GlutenPushablePredicateSuite]
diff --git a/gluten-ut/spark41/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala b/gluten-ut/spark41/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
index 11fbad7f6069..3ebe21812060 100644
--- a/gluten-ut/spark41/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
+++ b/gluten-ut/spark41/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
@@ -265,7 +265,8 @@ class VeloxTestSettings extends BackendTestSettings {
   enableSuite[GlutenDataSourceV2MetricsSuite]
   enableSuite[GlutenDataSourceV2OptionSuite]
   enableSuite[GlutenDataSourceV2UtilsSuite]
-  // TODO: 4.x enableSuite[GlutenGroupBasedUpdateTableSuite]  // 1 failure
+  enableSuite[GlutenGroupBasedUpdateTableSuite]
+    .exclude("update with NOT NULL checks")
   enableSuite[GlutenMergeIntoDataFrameSuite]
   enableSuite[GlutenProcedureSuite]
   enableSuite[GlutenPushablePredicateSuite]

From 61a1f282b9b23d68292b3244b0062b03137c091e Mon Sep 17 00:00:00 2001
From: Chang chen <changchen@microsoft.com>
Date: Tue, 24 Mar 2026 07:23:20 +0000
Subject: [PATCH 07/12] [GLUTEN-11550][UT] Enable 6 suites with targeted
 excludes

Enable with .exclude() for specific failing tests:
- GlutenWholeTextFileV1Suite: exclude jar:file: URI test
- GlutenWholeTextFileV2Suite: exclude jar:file: URI test
- GlutenScalaUDFSuite: exclude Variant encoder test (Spark 4.1 bug)
- GlutenExpressionEvalHelperSuite: exclude 2 tests (different failure names)
- GlutenToPrettyStringSuite: exclude timestamp timezone test (Velox UTC)
- GlutenGroupBasedUpdateTableSuite: exclude NOT NULL exception type test

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
---
 .../gluten/utils/velox/VeloxTestSettings.scala | 18 ++++++++++++------
 .../gluten/utils/velox/VeloxTestSettings.scala | 18 ++++++++++++------
 2 files changed, 24 insertions(+), 12 deletions(-)

diff --git a/gluten-ut/spark40/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala b/gluten-ut/spark40/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
index f0b0d697b80d..d1638cfbe53a 100644
--- a/gluten-ut/spark40/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
+++ b/gluten-ut/spark40/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
@@ -226,7 +226,9 @@ class VeloxTestSettings extends BackendTestSettings {
     .exclude("unsupported mode")
   enableSuite[GlutenDynamicPruningSubquerySuite]
   enableSuite[GlutenExprIdSuite]
-  // TODO: 4.x enableSuite[GlutenExpressionEvalHelperSuite]  // 2 failures
+  enableSuite[GlutenExpressionEvalHelperSuite]
+    .exclude("SPARK-16489: checkEvaluation should fail if expression reuses variable names")
+    .exclude("SPARK-25388: checkEvaluation should fail if nullable in DataType is incorrect")
   enableSuite[GlutenExpressionImplUtilsSuite]
   enableSuite[GlutenExpressionSQLBuilderSuite]
   enableSuite[GlutenExpressionSetSuite]
@@ -236,14 +238,16 @@ class VeloxTestSettings extends BackendTestSettings {
   enableSuite[GlutenNamedExpressionSuite]
   // TODO: 4.x enableSuite[GlutenObjectExpressionsSuite]  // 7 failures
   enableSuite[GlutenOrderingSuite]
-  // TODO: 4.x enableSuite[GlutenScalaUDFSuite]  // 1 failure
+  enableSuite[GlutenScalaUDFSuite]
+    .exclude("variant basic output variant")
   enableSuite[GlutenSchemaPruningSuite]
   enableSuite[GlutenSelectedFieldSuite]
   // GlutenSubExprEvaluationRuntimeSuite is removed because SubExprEvaluationRuntimeSuite
   // is in test-jar without shaded Guava, while SubExprEvaluationRuntime is shaded.
   enableSuite[GlutenSubexpressionEliminationSuite]
   enableSuite[GlutenTimeWindowSuite]
-  // TODO: 4.x enableSuite[GlutenToPrettyStringSuite]  // 1 failure
+  enableSuite[GlutenToPrettyStringSuite]
+    .exclude("Timestamp as pretty strings")
   enableSuite[GlutenUnsafeRowConverterSuite]
   enableSuite[GlutenUnwrapUDTExpressionSuite]
   enableSuite[GlutenV2ExpressionUtilsSuite]
@@ -394,8 +398,10 @@ class VeloxTestSettings extends BackendTestSettings {
     .exclude("parquet widening conversion ShortType -> DoubleType")
   enableSuite[GlutenParquetVariantShreddingSuite]
   // Generated suites for org.apache.spark.sql.execution.datasources.text
-  // TODO: 4.x enableSuite[GlutenWholeTextFileV1Suite]  // 1 failure
-  // TODO: 4.x enableSuite[GlutenWholeTextFileV2Suite]  // 1 failure
+  enableSuite[GlutenWholeTextFileV1Suite]
+    .exclude("reading text file with option wholetext=true")
+  enableSuite[GlutenWholeTextFileV2Suite]
+    .exclude("reading text file with option wholetext=true")
   // Generated suites for org.apache.spark.sql.execution.datasources.v2
   enableSuite[GlutenFileWriterFactorySuite]
   enableSuite[GlutenV2SessionCatalogNamespaceSuite]
@@ -1096,7 +1102,7 @@ class VeloxTestSettings extends BackendTestSettings {
   enableSuite[GlutenFallbackSuite]
   enableSuite[GlutenHiveSQLQuerySuite]
   enableSuite[GlutenCollapseProjectExecTransformerSuite]
-  // TODO: 4.x enableSuite[GlutenSparkSessionExtensionSuite]  // 1 failure
+  // TODO: 4.x enableSuite[GlutenSparkSessionExtensionSuite]  // GlutenPlugin interferes with custom session extensions
   enableSuite[GlutenGroupBasedDeleteFromTableSuite]
   enableSuite[GlutenDeltaBasedDeleteFromTableSuite]
   enableSuite[GlutenDataFrameToSchemaSuite]
diff --git a/gluten-ut/spark41/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala b/gluten-ut/spark41/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
index 3ebe21812060..c69638f0968b 100644
--- a/gluten-ut/spark41/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
+++ b/gluten-ut/spark41/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
@@ -237,7 +237,9 @@ class VeloxTestSettings extends BackendTestSettings {
     .exclude("unsupported mode")
   enableSuite[GlutenDynamicPruningSubquerySuite]
   enableSuite[GlutenExprIdSuite]
-  // TODO: 4.x enableSuite[GlutenExpressionEvalHelperSuite]  // 2 failures
+  enableSuite[GlutenExpressionEvalHelperSuite]
+    .exclude("SPARK-16489: checkEvaluation should fail if expression reuses variable names")
+    .exclude("SPARK-25388: checkEvaluation should fail if nullable in DataType is incorrect")
   enableSuite[GlutenExpressionImplUtilsSuite]
   enableSuite[GlutenExpressionSQLBuilderSuite]
   enableSuite[GlutenExpressionSetSuite]
@@ -247,14 +249,16 @@ class VeloxTestSettings extends BackendTestSettings {
   enableSuite[GlutenNamedExpressionSuite]
   // TODO: 4.x enableSuite[GlutenObjectExpressionsSuite]  // 7 failures
   // TODO: 4.x enableSuite[GlutenOrderingSuite]  // 2 failures
-  // TODO: 4.x enableSuite[GlutenScalaUDFSuite]  // 1 failure
+  enableSuite[GlutenScalaUDFSuite]
+    .exclude("variant basic output variant")
   enableSuite[GlutenSchemaPruningSuite]
   enableSuite[GlutenSelectedFieldSuite]
   // GlutenSubExprEvaluationRuntimeSuite is removed because SubExprEvaluationRuntimeSuite
   // is in test-jar without shaded Guava, while SubExprEvaluationRuntime is shaded.
   enableSuite[GlutenSubexpressionEliminationSuite]
   enableSuite[GlutenTimeWindowSuite]
-  // TODO: 4.x enableSuite[GlutenToPrettyStringSuite]  // 1 failure
+  enableSuite[GlutenToPrettyStringSuite]
+    .exclude("Timestamp as pretty strings")
   enableSuite[GlutenUnsafeRowConverterSuite]
   enableSuite[GlutenUnwrapUDTExpressionSuite]
   enableSuite[GlutenV2ExpressionUtilsSuite]
@@ -405,8 +409,10 @@ class VeloxTestSettings extends BackendTestSettings {
     .exclude("parquet widening conversion ShortType -> DoubleType")
   enableSuite[GlutenParquetVariantShreddingSuite]
   // Generated suites for org.apache.spark.sql.execution.datasources.text
-  // TODO: 4.x enableSuite[GlutenWholeTextFileV1Suite]  // 1 failure
-  // TODO: 4.x enableSuite[GlutenWholeTextFileV2Suite]  // 1 failure
+  enableSuite[GlutenWholeTextFileV1Suite]
+    .exclude("reading text file with option wholetext=true")
+  enableSuite[GlutenWholeTextFileV2Suite]
+    .exclude("reading text file with option wholetext=true")
   // Generated suites for org.apache.spark.sql.execution.datasources.v2
   enableSuite[GlutenFileWriterFactorySuite]
   enableSuite[GlutenV2SessionCatalogNamespaceSuite]
@@ -1087,7 +1093,7 @@ class VeloxTestSettings extends BackendTestSettings {
   enableSuite[GlutenFallbackSuite]
   enableSuite[GlutenHiveSQLQuerySuite]
   enableSuite[GlutenCollapseProjectExecTransformerSuite]
-  // TODO: 4.x enableSuite[GlutenSparkSessionExtensionSuite]  // 1 failure
+  // TODO: 4.x enableSuite[GlutenSparkSessionExtensionSuite]  // GlutenPlugin interferes with custom session extensions
   enableSuite[GlutenGroupBasedDeleteFromTableSuite]
   enableSuite[GlutenDeltaBasedDeleteFromTableSuite]
   enableSuite[GlutenDataFrameToSchemaSuite]

From 86801673a7388a0bbe58c3326b5709dc4fe2c34e Mon Sep 17 00:00:00 2001
From: Chang chen <changchen@microsoft.com>
Date: Tue, 24 Mar 2026 09:15:59 +0000
Subject: [PATCH 08/12] [GLUTEN-11550][UT] Enable 11 more suites with targeted
 excludes

Enable plan-structure and other suites with .exclude() for failing tests:

| Suite | Passed | Excluded | Root Cause |
|-------|:------:|:--------:|------------|
| GlutenJoinHintSuite | 17 | 1 | CartesianProduct not supported |
| GlutenExplainSuite | 20 | 4 | WholeStageCodegen/FileScan in explain |
| GlutenDataSourceScanExecRedactionSuite | 2 | 2 | FileScan replaced by native scan |
| GlutenDataSourceV2ScanExecRedactionSuite | 1 | 2 | BatchScan replaced |
| GlutenInsertSortForLimitAndOffsetSuite | 0 | 6 | TakeOrderedAndProject replaced |
| GlutenProjectedOrderingAndPartitioningSuite | 1 | 9 | SinglePartition vs HashPartitioning |
| GlutenRemoveRedundantProjectsSuite | 3 | 14 | Plan tree structure differs |
| GlutenSimpleSQLViewSuite | 52 | 2 | Error condition + query result |
| GlutenPlannerSuite | 55 | 21 | TakeOrderedAndProject/sort/partitioning |
| GlutenRemoveRedundantSortsSuite | 0 | 5 | SortExec replaced |
| GlutenObjectExpressionsSuite | 13 | 15 | Spark 4.1 encoder API change |

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
---
 .../utils/velox/VeloxTestSettings.scala       | 77 ++++++++++++++++---
 .../utils/velox/VeloxTestSettings.scala       | 77 ++++++++++++++++---
 2 files changed, 130 insertions(+), 24 deletions(-)

diff --git a/gluten-ut/spark40/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala b/gluten-ut/spark40/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
index d1638cfbe53a..a42167392a1d 100644
--- a/gluten-ut/spark40/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
+++ b/gluten-ut/spark40/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
@@ -236,7 +236,10 @@ class VeloxTestSettings extends BackendTestSettings {
   enableSuite[GlutenHexSuite]
   enableSuite[GlutenMutableProjectionSuite]
   enableSuite[GlutenNamedExpressionSuite]
-  // TODO: 4.x enableSuite[GlutenObjectExpressionsSuite]  // 7 failures
+  enableSuite[GlutenObjectExpressionsSuite]
+    .excludeByPrefix("SPARK-2359")
+    .excludeByPrefix("SPARK-2358")
+    .exclude("LambdaVariable should support interpreted execution")
   enableSuite[GlutenOrderingSuite]
   enableSuite[GlutenScalaUDFSuite]
     .exclude("variant basic output variant")
@@ -704,30 +707,75 @@ class VeloxTestSettings extends BackendTestSettings {
   enableSuite[GlutenAggregatingAccumulatorSuite]
   enableSuite[GlutenCoGroupedIteratorSuite]
   enableSuite[GlutenColumnarRulesSuite]
-  // TODO: 4.x enableSuite[GlutenDataSourceScanExecRedactionSuite]  // 2 failures
-  // TODO: 4.x enableSuite[GlutenDataSourceV2ScanExecRedactionSuite]  // 2 failures
+  enableSuite[GlutenDataSourceScanExecRedactionSuite]
+    .exclude("explain is redacted using SQLConf")
+    .exclude("SPARK-31793: FileSourceScanExec metadata should contain limited file paths")
+  enableSuite[GlutenDataSourceV2ScanExecRedactionSuite]
+    .exclude("explain is redacted using SQLConf")
+    .exclude("FileScan description")
   enableSuite[GlutenExecuteImmediateEndToEndSuite]
   enableSuite[GlutenExternalAppendOnlyUnsafeRowArraySuite]
   enableSuite[GlutenGlobalTempViewSuite]
   enableSuite[GlutenGlobalTempViewTestSuite]
   enableSuite[GlutenGroupedIteratorSuite]
   enableSuite[GlutenHiveResultSuite]
-  // TODO: 4.x enableSuite[GlutenInsertSortForLimitAndOffsetSuite]  // 6 failures
+  enableSuite[GlutenInsertSortForLimitAndOffsetSuite]
+    .exclude("root LIMIT preserves data ordering with top-K sort")
+    .exclude("middle LIMIT preserves data ordering with top-K sort")
+    .exclude("root LIMIT preserves data ordering with CollectLimitExec")
+    .exclude("middle LIMIT preserves data ordering with the extra sort")
+    .exclude("root OFFSET preserves data ordering with CollectLimitExec")
+    .exclude("middle OFFSET preserves data ordering with the extra sort")
   enableSuite[GlutenLocalTempViewTestSuite]
   // TODO: 4.x enableSuite[GlutenLogicalPlanTagInSparkPlanSuite]  // RUN ABORTED
   enableSuite[GlutenOptimizeMetadataOnlyQuerySuite]
   enableSuite[GlutenPersistedViewTestSuite]
-  // TODO: 4.x enableSuite[GlutenPlannerSuite]  // 1 failure
-  // TODO: 4.x enableSuite[GlutenProjectedOrderingAndPartitioningSuite]  // 6 failures
+  enableSuite[GlutenPlannerSuite]
+    .excludeByPrefix("efficient terminal limit")
+    .excludeByPrefix("terminal limit -> project -> sort")
+    .excludeByPrefix("TakeOrderedAndProject can appear")
+    .excludeByPrefix("TakeOrderedAndProjectExec appears only")
+    .excludeByPrefix("SPARK-24242")
+    .excludeByPrefix("SPARK-24556")
+    .excludeByPrefix("SPARK-33399")
+    .excludeByPrefix("SPARK-33400")
+    .excludeByPrefix("sort order doesn't have repeated")
+    .excludeByPrefix("aliases to expressions should not be replaced")
+    .excludeByPrefix("aliases in the object hash")
+    .excludeByPrefix("SPARK-33758")
+    .excludeByPrefix("SPARK-40086")
+  enableSuite[GlutenProjectedOrderingAndPartitioningSuite]
+    .excludeByPrefix("SPARK-42049")
   enableSuite[GlutenQueryPlanningTrackerEndToEndSuite]
-  // TODO: 4.x enableSuite[GlutenRemoveRedundantProjectsSuite]  // 14 failures
-  // TODO: 4.x enableSuite[GlutenRemoveRedundantSortsSuite]  // 1 failure
+  enableSuite[GlutenRemoveRedundantProjectsSuite]
+    .exclude("project with filter")
+    .exclude("project with specific column ordering")
+    .exclude("project with extra columns")
+    .exclude("project with fewer columns")
+    .exclude("aggregate without ordering requirement")
+    .exclude("aggregate with ordering requirement")
+    .exclude("join without ordering requirement")
+    .exclude("join with ordering requirement")
+    .exclude("window function")
+    .exclude("generate should require column ordering")
+    .exclude("subquery")
+    .exclude("SPARK-33697: UnionExec should require column ordering")
+    .exclude("SPARK-33697: remove redundant projects under expand")
+    .exclude("SPARK-36020: Project should not be removed when child's logical link is different")
+  enableSuite[GlutenRemoveRedundantSortsSuite]
+    .exclude("cached sorted data doesn't need to be re-sorted")
+    .exclude("SPARK-33472: shuffled join with different left and right side partition numbers")
+    .exclude("remove redundant sorts with limit")
+    .exclude("remove redundant sorts with broadcast hash join")
+    .exclude("remove redundant sorts with sort merge join")
   enableSuite[GlutenRowToColumnConverterSuite]
   enableSuite[GlutenSQLExecutionSuite]
   enableSuite[GlutenSQLFunctionSuite]
   enableSuite[GlutenSQLJsonProtocolSuite]
   enableSuite[GlutenShufflePartitionsUtilSuite]
-  // TODO: 4.x enableSuite[GlutenSimpleSQLViewSuite]  // 1 failure
+  enableSuite[GlutenSimpleSQLViewSuite]
+    .exclude("alter temporary view should follow current storeAnalyzedPlanForView config")
+    .exclude("SPARK-53968 reading the view after allowPrecisionLoss is changed")
   enableSuite[GlutenSparkPlanSuite]
     .exclude("SPARK-37779: ColumnarToRowExec should be canonicalizable after being (de)serialized")
   enableSuite[GlutenSparkPlannerSuite]
@@ -834,10 +882,15 @@ class VeloxTestSettings extends BackendTestSettings {
   enableSuite[GlutenDataFrameTransposeSuite]
   enableSuite[GlutenDefaultANSIValueSuite]
   enableSuite[GlutenDeprecatedDatasetAggregatorSuite]
-  // TODO: 4.x enableSuite[GlutenExplainSuite]  // 1 failure
+  enableSuite[GlutenExplainSuite]
+    .exclude("SPARK-33853: explain codegen - check presence of subquery")
+    .exclude("explain formatted - check presence of subquery in case of DPP")
+    .exclude("Support ExplainMode in Dataset.explain")
+    .exclude("Explain formatted output for scan operator for datasource V2")
   enableSuite[GlutenICUCollationsMapSuite]
   enableSuite[GlutenInlineTableParsingImprovementsSuite]
-  // TODO: 4.x enableSuite[GlutenJoinHintSuite]  // 1 failure
+  enableSuite[GlutenJoinHintSuite]
+    .exclude("join strategy hint - shuffle-replicate-nl")
   enableSuite[GlutenLogQuerySuite]
     // Overridden
     .exclude("Query Spark logs with exception using SQL")
@@ -848,7 +901,7 @@ class VeloxTestSettings extends BackendTestSettings {
   enableSuite[GlutenRuntimeConfigSuite]
   enableSuite[GlutenSSBQuerySuite]
   enableSuite[GlutenSessionStateSuite]
-  // TODO: 4.x enableSuite[GlutenSetCommandSuite]  // 1 failure
+  // TODO: 4.x enableSuite[GlutenSetCommandSuite]  // hive-site.xml hadoop conf not loaded
   enableSuite[GlutenSparkSessionBuilderSuite]
   enableSuite[GlutenSparkSessionJobTaggingAndCancellationSuite]
   enableSuite[GlutenTPCDSCollationQueryTestSuite]
diff --git a/gluten-ut/spark41/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala b/gluten-ut/spark41/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
index c69638f0968b..2760e846d731 100644
--- a/gluten-ut/spark41/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
+++ b/gluten-ut/spark41/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
@@ -247,7 +247,10 @@ class VeloxTestSettings extends BackendTestSettings {
   enableSuite[GlutenHexSuite]
   enableSuite[GlutenMutableProjectionSuite]
   enableSuite[GlutenNamedExpressionSuite]
-  // TODO: 4.x enableSuite[GlutenObjectExpressionsSuite]  // 7 failures
+  enableSuite[GlutenObjectExpressionsSuite]
+    .excludeByPrefix("SPARK-2359")
+    .excludeByPrefix("SPARK-2358")
+    .exclude("LambdaVariable should support interpreted execution")
   // TODO: 4.x enableSuite[GlutenOrderingSuite]  // 2 failures
   enableSuite[GlutenScalaUDFSuite]
     .exclude("variant basic output variant")
@@ -674,30 +677,75 @@ class VeloxTestSettings extends BackendTestSettings {
   enableSuite[GlutenAggregatingAccumulatorSuite]
   enableSuite[GlutenCoGroupedIteratorSuite]
   // TODO: 4.x enableSuite[GlutenColumnarRulesSuite]  // 1 failure
-  // TODO: 4.x enableSuite[GlutenDataSourceScanExecRedactionSuite]  // 2 failures
-  // TODO: 4.x enableSuite[GlutenDataSourceV2ScanExecRedactionSuite]  // 2 failures
+  enableSuite[GlutenDataSourceScanExecRedactionSuite]
+    .exclude("explain is redacted using SQLConf")
+    .exclude("SPARK-31793: FileSourceScanExec metadata should contain limited file paths")
+  enableSuite[GlutenDataSourceV2ScanExecRedactionSuite]
+    .exclude("explain is redacted using SQLConf")
+    .exclude("FileScan description")
   enableSuite[GlutenExecuteImmediateEndToEndSuite]
   enableSuite[GlutenExternalAppendOnlyUnsafeRowArraySuite]
   enableSuite[GlutenGlobalTempViewSuite]
   enableSuite[GlutenGlobalTempViewTestSuite]
   enableSuite[GlutenGroupedIteratorSuite]
   // TODO: 4.x enableSuite[GlutenHiveResultSuite]  // 1 failure
-  // TODO: 4.x enableSuite[GlutenInsertSortForLimitAndOffsetSuite]  // 6 failures
+  enableSuite[GlutenInsertSortForLimitAndOffsetSuite]
+    .exclude("root LIMIT preserves data ordering with top-K sort")
+    .exclude("middle LIMIT preserves data ordering with top-K sort")
+    .exclude("root LIMIT preserves data ordering with CollectLimitExec")
+    .exclude("middle LIMIT preserves data ordering with the extra sort")
+    .exclude("root OFFSET preserves data ordering with CollectLimitExec")
+    .exclude("middle OFFSET preserves data ordering with the extra sort")
   enableSuite[GlutenLocalTempViewTestSuite]
   // TODO: 4.x enableSuite[GlutenLogicalPlanTagInSparkPlanSuite]  // RUN ABORTED
   enableSuite[GlutenOptimizeMetadataOnlyQuerySuite]
   enableSuite[GlutenPersistedViewTestSuite]
-  // TODO: 4.x enableSuite[GlutenPlannerSuite]  // 1 failure
-  // TODO: 4.x enableSuite[GlutenProjectedOrderingAndPartitioningSuite]  // 6 failures
+  enableSuite[GlutenPlannerSuite]
+    .excludeByPrefix("efficient terminal limit")
+    .excludeByPrefix("terminal limit -> project -> sort")
+    .excludeByPrefix("TakeOrderedAndProject can appear")
+    .excludeByPrefix("TakeOrderedAndProjectExec appears only")
+    .excludeByPrefix("SPARK-24242")
+    .excludeByPrefix("SPARK-24556")
+    .excludeByPrefix("SPARK-33399")
+    .excludeByPrefix("SPARK-33400")
+    .excludeByPrefix("sort order doesn't have repeated")
+    .excludeByPrefix("aliases to expressions should not be replaced")
+    .excludeByPrefix("aliases in the object hash")
+    .excludeByPrefix("SPARK-33758")
+    .excludeByPrefix("SPARK-40086")
+  enableSuite[GlutenProjectedOrderingAndPartitioningSuite]
+    .excludeByPrefix("SPARK-42049")
   enableSuite[GlutenQueryPlanningTrackerEndToEndSuite]
-  // TODO: 4.x enableSuite[GlutenRemoveRedundantProjectsSuite]  // 14 failures
-  // TODO: 4.x enableSuite[GlutenRemoveRedundantSortsSuite]  // 1 failure
+  enableSuite[GlutenRemoveRedundantProjectsSuite]
+    .exclude("project with filter")
+    .exclude("project with specific column ordering")
+    .exclude("project with extra columns")
+    .exclude("project with fewer columns")
+    .exclude("aggregate without ordering requirement")
+    .exclude("aggregate with ordering requirement")
+    .exclude("join without ordering requirement")
+    .exclude("join with ordering requirement")
+    .exclude("window function")
+    .exclude("generate should require column ordering")
+    .exclude("subquery")
+    .exclude("SPARK-33697: UnionExec should require column ordering")
+    .exclude("SPARK-33697: remove redundant projects under expand")
+    .exclude("SPARK-36020: Project should not be removed when child's logical link is different")
+  enableSuite[GlutenRemoveRedundantSortsSuite]
+    .exclude("cached sorted data doesn't need to be re-sorted")
+    .exclude("SPARK-33472: shuffled join with different left and right side partition numbers")
+    .exclude("remove redundant sorts with limit")
+    .exclude("remove redundant sorts with broadcast hash join")
+    .exclude("remove redundant sorts with sort merge join")
   enableSuite[GlutenRowToColumnConverterSuite]
   enableSuite[GlutenSQLExecutionSuite]
   enableSuite[GlutenSQLFunctionSuite]
   enableSuite[GlutenSQLJsonProtocolSuite]
   enableSuite[GlutenShufflePartitionsUtilSuite]
-  // TODO: 4.x enableSuite[GlutenSimpleSQLViewSuite]  // 2 failures
+  enableSuite[GlutenSimpleSQLViewSuite]
+    .exclude("alter temporary view should follow current storeAnalyzedPlanForView config")
+    .exclude("SPARK-53968 reading the view after allowPrecisionLoss is changed")
   enableSuite[GlutenSparkPlanSuite]
     .exclude("SPARK-37779: ColumnarToRowExec should be canonicalizable after being (de)serialized")
   enableSuite[GlutenSparkPlannerSuite]
@@ -805,10 +853,15 @@ class VeloxTestSettings extends BackendTestSettings {
   enableSuite[GlutenDataFrameTableValuedFunctionsSuite]
   enableSuite[GlutenDataFrameTransposeSuite]
   enableSuite[GlutenDeprecatedDatasetAggregatorSuite]
-  // TODO: 4.x enableSuite[GlutenExplainSuite]  // 1 failure
+  enableSuite[GlutenExplainSuite]
+    .exclude("SPARK-33853: explain codegen - check presence of subquery")
+    .exclude("explain formatted - check presence of subquery in case of DPP")
+    .exclude("Support ExplainMode in Dataset.explain")
+    .exclude("Explain formatted output for scan operator for datasource V2")
   enableSuite[GlutenICUCollationsMapSuite]
   enableSuite[GlutenInlineTableParsingImprovementsSuite]
-  // TODO: 4.x enableSuite[GlutenJoinHintSuite]  // 1 failure
+  enableSuite[GlutenJoinHintSuite]
+    .exclude("join strategy hint - shuffle-replicate-nl")
   enableSuite[GlutenLogQuerySuite]
     // Overridden
     .exclude("Query Spark logs with exception using SQL")
@@ -819,7 +872,7 @@ class VeloxTestSettings extends BackendTestSettings {
   enableSuite[GlutenRuntimeConfigSuite]
   enableSuite[GlutenSSBQuerySuite]
   enableSuite[GlutenSessionStateSuite]
-  // TODO: 4.x enableSuite[GlutenSetCommandSuite]  // 1 failure
+  // TODO: 4.x enableSuite[GlutenSetCommandSuite]  // hive-site.xml hadoop conf not loaded
   enableSuite[GlutenSparkSessionBuilderSuite]
   enableSuite[GlutenSparkSessionJobTaggingAndCancellationSuite]
   enableSuite[GlutenTPCDSCollationQueryTestSuite]

From 08f6890b4b7a023d9b0971936123c461c9112ab5 Mon Sep 17 00:00:00 2001
From: Chang chen <changchen@microsoft.com>
Date: Tue, 24 Mar 2026 09:27:59 +0000
Subject: [PATCH 09/12] [GLUTEN-11550][UT] Enable 5 spark41-only suites with
 TimeType/native-engine excludes

- GlutenOrderingSuite: 54 passed, 2 TimeType excluded
- GlutenHiveResultSuite: 10 passed, 1 TimeType excluded
- GlutenCollationRegexpExpressionsSuite: 3 passed, 1 Velox split excluded
- GlutenColumnarRulesSuite: 2 passed, 1 Transition excluded
- RandomDataGeneratorSuite: kept TODO (232 TimeType failures, impractical to exclude individually)

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
---
 .../gluten/utils/velox/VeloxTestSettings.scala     | 14 +++++++++-----
 1 file changed, 9 insertions(+), 5 deletions(-)

diff --git a/gluten-ut/spark41/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala b/gluten-ut/spark41/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
index 2760e846d731..fc2d4521e7f7 100644
--- a/gluten-ut/spark41/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
+++ b/gluten-ut/spark41/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
@@ -232,7 +232,8 @@ class VeloxTestSettings extends BackendTestSettings {
   enableSuite[GlutenCodeGenerationSuite]
   enableSuite[GlutenCodeGeneratorWithInterpretedFallbackSuite]
   enableSuite[GlutenCollationExpressionSuite]
-  // TODO: 4.x enableSuite[GlutenCollationRegexpExpressionsSuite]  // 1 failure
+  enableSuite[GlutenCollationRegexpExpressionsSuite]
+    .exclude("StringSplit expression with collated strings")
   enableSuite[GlutenCsvExpressionsSuite]
     .exclude("unsupported mode")
   enableSuite[GlutenDynamicPruningSubquerySuite]
@@ -251,7 +252,8 @@ class VeloxTestSettings extends BackendTestSettings {
     .excludeByPrefix("SPARK-2359")
     .excludeByPrefix("SPARK-2358")
     .exclude("LambdaVariable should support interpreted execution")
-  // TODO: 4.x enableSuite[GlutenOrderingSuite]  // 2 failures
+  enableSuite[GlutenOrderingSuite]
+    .excludeByPrefix("GenerateOrdering with TimeType")
   enableSuite[GlutenScalaUDFSuite]
     .exclude("variant basic output variant")
   enableSuite[GlutenSchemaPruningSuite]
@@ -676,7 +678,8 @@ class VeloxTestSettings extends BackendTestSettings {
   // Generated suites for org.apache.spark.sql.execution
   enableSuite[GlutenAggregatingAccumulatorSuite]
   enableSuite[GlutenCoGroupedIteratorSuite]
-  // TODO: 4.x enableSuite[GlutenColumnarRulesSuite]  // 1 failure
+  enableSuite[GlutenColumnarRulesSuite]
+    .excludeByPrefix("SPARK-51474")
   enableSuite[GlutenDataSourceScanExecRedactionSuite]
     .exclude("explain is redacted using SQLConf")
     .exclude("SPARK-31793: FileSourceScanExec metadata should contain limited file paths")
@@ -688,7 +691,8 @@ class VeloxTestSettings extends BackendTestSettings {
   enableSuite[GlutenGlobalTempViewSuite]
   enableSuite[GlutenGlobalTempViewTestSuite]
   enableSuite[GlutenGroupedIteratorSuite]
-  // TODO: 4.x enableSuite[GlutenHiveResultSuite]  // 1 failure
+  enableSuite[GlutenHiveResultSuite]
+    .exclude("time formatting in hive result")
   enableSuite[GlutenInsertSortForLimitAndOffsetSuite]
     .exclude("root LIMIT preserves data ordering with top-K sort")
     .exclude("middle LIMIT preserves data ordering with top-K sort")
@@ -866,7 +870,7 @@ class VeloxTestSettings extends BackendTestSettings {
     // Overridden
     .exclude("Query Spark logs with exception using SQL")
   enableSuite[GlutenPercentileQuerySuite]
-  // TODO: 4.x enableSuite[GlutenRandomDataGeneratorSuite]  // 232 failures
+  // TODO: 4.x enableSuite[GlutenRandomDataGeneratorSuite]  // 232 TimeType failures, need Velox C++ support
   enableSuite[GlutenRowJsonSuite]
   enableSuite[GlutenRowSuite]
   enableSuite[GlutenRuntimeConfigSuite]

From 3de26edec0655365939729dce044f72f884d9077 Mon Sep 17 00:00:00 2001
From: Chang chen <changchen@microsoft.com>
Date: Tue, 24 Mar 2026 13:37:01 +0000
Subject: [PATCH 10/12] Fix spark40 CsvExpressionsSuite compilation: use
 correct GlutenTestsTrait import

spark40 does not have org.apache.spark.sql.shim.GlutenTestsTrait (that shim
only exists for spark41). Use org.apache.spark.sql.GlutenTestsTrait instead.

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
---
 .../sql/catalyst/expressions/GlutenCsvExpressionsSuite.scala    | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/catalyst/expressions/GlutenCsvExpressionsSuite.scala b/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/catalyst/expressions/GlutenCsvExpressionsSuite.scala
index 19e3724823b2..a2d2e1bc624c 100644
--- a/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/catalyst/expressions/GlutenCsvExpressionsSuite.scala
+++ b/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/catalyst/expressions/GlutenCsvExpressionsSuite.scala
@@ -17,9 +17,9 @@
 package org.apache.spark.sql.catalyst.expressions
 
 import org.apache.spark.sql.AnalysisException
+import org.apache.spark.sql.GlutenTestsTrait
 import org.apache.spark.sql.catalyst.InternalRow
 import org.apache.spark.sql.catalyst.util.DateTimeTestUtils.UTC_OPT
-import org.apache.spark.sql.shim.GlutenTestsTrait
 import org.apache.spark.sql.types.{DoubleType, StructField, StructType}
 
 class GlutenCsvExpressionsSuite extends CsvExpressionsSuite with GlutenTestsTrait {

From 451760d2bbd20eaba9a64b8b42e8f67ffc27f59a Mon Sep 17 00:00:00 2001
From: Chang chen <changchen@microsoft.com>
Date: Wed, 25 Mar 2026 06:40:36 +0000
Subject: [PATCH 11/12] Enable GlutenLogicalPlanTagInSparkPlanSuite (150/150
 tests)

Root cause: Gluten's offload rules replace Spark physical plan nodes with
Transformer nodes but don't propagate LOGICAL_PLAN_TAG. This tag is used by
Spark's LogicalPlanTagInSparkPlanSuite to verify logical-physical plan linkage.

Three core fixes:
1. LegacyOffload: propagate LOGICAL_PLAN_TAG from original node to offloaded
   Transformer node using setTagValue (non-recursive to avoid tagging Exchange).
2. HeuristicTransform.Simple: same tag propagation for the simple offload path.
3. PushDownFilterToScan: copyTagsFrom when creating new scan via
   withNewPushdownFilters (case class copy loses tags).

Test suite overrides checkGeneratedCode with Gluten-aware version that:
- Recognizes Transformer node types (joins, aggregates, windows, scans, etc.)
- For scan trees, finds logical plan tag from any node in the tree (not just
  root), since rewrite rules may create new Project/Filter without tags.

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
---
 .../heuristic/HeuristicTransform.scala        |   8 +-
 .../columnar/heuristic/LegacyOffload.scala    |  17 +-
 .../columnar/PushDownFilterToScan.scala       |   1 +
 .../utils/velox/VeloxTestSettings.scala       |   2 +-
 ...GlutenLogicalPlanTagInSparkPlanSuite.scala | 170 +++++++++++++++++-
 .../utils/velox/VeloxTestSettings.scala       |   2 +-
 ...GlutenLogicalPlanTagInSparkPlanSuite.scala | 170 +++++++++++++++++-
 7 files changed, 364 insertions(+), 6 deletions(-)

diff --git a/gluten-core/src/main/scala/org/apache/gluten/extension/columnar/heuristic/HeuristicTransform.scala b/gluten-core/src/main/scala/org/apache/gluten/extension/columnar/heuristic/HeuristicTransform.scala
index b3051953740f..8b070083a2e4 100644
--- a/gluten-core/src/main/scala/org/apache/gluten/extension/columnar/heuristic/HeuristicTransform.scala
+++ b/gluten-core/src/main/scala/org/apache/gluten/extension/columnar/heuristic/HeuristicTransform.scala
@@ -81,7 +81,13 @@ object HeuristicTransform {
             node =>
               validator.validate(node) match {
                 case Validator.Passed =>
-                  rule.offload(node)
+                  val offloaded = rule.offload(node)
+                  if (offloaded ne node) {
+                    node.getTagValue(SparkPlan.LOGICAL_PLAN_TAG).foreach {
+                      lp => offloaded.setTagValue(SparkPlan.LOGICAL_PLAN_TAG, lp)
+                    }
+                  }
+                  offloaded
                 case Validator.Failed(reason) =>
                   logDebug(s"Validation failed by reason: $reason on query plan: ${node.nodeName}")
                   if (FallbackTags.maybeOffloadable(node)) {
diff --git a/gluten-core/src/main/scala/org/apache/gluten/extension/columnar/heuristic/LegacyOffload.scala b/gluten-core/src/main/scala/org/apache/gluten/extension/columnar/heuristic/LegacyOffload.scala
index c0c44f390d29..d24616ed1a56 100644
--- a/gluten-core/src/main/scala/org/apache/gluten/extension/columnar/heuristic/LegacyOffload.scala
+++ b/gluten-core/src/main/scala/org/apache/gluten/extension/columnar/heuristic/LegacyOffload.scala
@@ -25,7 +25,22 @@ import org.apache.spark.sql.execution.SparkPlan
 class LegacyOffload(rules: Seq[OffloadSingleNode]) extends Rule[SparkPlan] with LogLevelUtil {
   def apply(plan: SparkPlan): SparkPlan = {
     val out =
-      rules.foldLeft(plan)((p, rule) => p.transformUp { case p => rule.offload(p) })
+      rules.foldLeft(plan) {
+        (p, rule) =>
+          p.transformUp {
+            case node =>
+              val offloaded = rule.offload(node)
+              if (offloaded ne node) {
+                // Propagate logical plan tag from original to offloaded node (non-recursive).
+                // Using setTagValue directly to avoid setLogicalLink's recursive propagation
+                // to children, which would incorrectly tag Exchange nodes.
+                node.getTagValue(SparkPlan.LOGICAL_PLAN_TAG).foreach {
+                  lp => offloaded.setTagValue(SparkPlan.LOGICAL_PLAN_TAG, lp)
+                }
+              }
+              offloaded
+          }
+      }
     out
   }
 }
diff --git a/gluten-substrait/src/main/scala/org/apache/gluten/extension/columnar/PushDownFilterToScan.scala b/gluten-substrait/src/main/scala/org/apache/gluten/extension/columnar/PushDownFilterToScan.scala
index 9a6e271b35ac..b9e02461b1fb 100644
--- a/gluten-substrait/src/main/scala/org/apache/gluten/extension/columnar/PushDownFilterToScan.scala
+++ b/gluten-substrait/src/main/scala/org/apache/gluten/extension/columnar/PushDownFilterToScan.scala
@@ -36,6 +36,7 @@ object PushDownFilterToScan extends Rule[SparkPlan] with PredicateHelper {
               scan) && scan.supportPushDownFilters =>
           val newScan = scan.withNewPushdownFilters(splitConjunctivePredicates(filter.cond))
           if (newScan.doValidate().ok()) {
+            newScan.copyTagsFrom(scan)
             filter.withNewChildren(Seq(newScan))
           } else {
             filter
diff --git a/gluten-ut/spark40/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala b/gluten-ut/spark40/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
index a42167392a1d..cc4e5ed0993f 100644
--- a/gluten-ut/spark40/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
+++ b/gluten-ut/spark40/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
@@ -727,7 +727,7 @@ class VeloxTestSettings extends BackendTestSettings {
     .exclude("root OFFSET preserves data ordering with CollectLimitExec")
     .exclude("middle OFFSET preserves data ordering with the extra sort")
   enableSuite[GlutenLocalTempViewTestSuite]
-  // TODO: 4.x enableSuite[GlutenLogicalPlanTagInSparkPlanSuite]  // RUN ABORTED
+  enableSuite[GlutenLogicalPlanTagInSparkPlanSuite]
   enableSuite[GlutenOptimizeMetadataOnlyQuerySuite]
   enableSuite[GlutenPersistedViewTestSuite]
   enableSuite[GlutenPlannerSuite]
diff --git a/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/execution/GlutenLogicalPlanTagInSparkPlanSuite.scala b/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/execution/GlutenLogicalPlanTagInSparkPlanSuite.scala
index 297d3b2a3428..a01c81a08fa3 100644
--- a/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/execution/GlutenLogicalPlanTagInSparkPlanSuite.scala
+++ b/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/execution/GlutenLogicalPlanTagInSparkPlanSuite.scala
@@ -16,8 +16,176 @@
  */
 package org.apache.spark.sql.execution
 
+import org.apache.gluten.execution._
+
 import org.apache.spark.sql.GlutenSQLTestsTrait
+import org.apache.spark.sql.catalyst.expressions.aggregate.{AggregateExpression, Complete, Final}
+import org.apache.spark.sql.catalyst.plans.logical._
+import org.apache.spark.sql.execution.columnar.InMemoryTableScanExec
+import org.apache.spark.sql.execution.datasources.LogicalRelation
+import org.apache.spark.sql.execution.datasources.v2.DataSourceV2Relation
+import org.apache.spark.sql.execution.exchange.ReusedExchangeExec
+
+import scala.reflect.ClassTag
 
 class GlutenLogicalPlanTagInSparkPlanSuite
   extends LogicalPlanTagInSparkPlanSuite
-  with GlutenSQLTestsTrait {}
+  with GlutenSQLTestsTrait {
+
+  // Override to use Gluten-aware logical plan tag checking.
+  // Gluten replaces Spark physical operators with Transformer nodes that don't match
+  // the original Spark pattern matching in LogicalPlanTagInSparkPlanSuite.
+  override protected def checkGeneratedCode(
+      plan: SparkPlan,
+      checkMethodCodeSize: Boolean = true): Unit = {
+    // Skip parent's codegen check (Gluten doesn't use WholeStageCodegen).
+    // Only run the Gluten-aware logical plan tag check.
+    checkGlutenLogicalPlanTag(plan)
+  }
+
+  private def isFinalAgg(aggExprs: Seq[AggregateExpression]): Boolean = {
+    aggExprs.nonEmpty && aggExprs.forall(ae => ae.mode == Complete || ae.mode == Final)
+  }
+
+  private def checkGlutenLogicalPlanTag(plan: SparkPlan): Unit = {
+    plan match {
+      // Joins (Gluten + Spark)
+      case _: BroadcastHashJoinExecTransformerBase | _: ShuffledHashJoinExecTransformerBase |
+          _: SortMergeJoinExecTransformerBase | _: CartesianProductExecTransformer |
+          _: BroadcastNestedLoopJoinExecTransformer | _: joins.BroadcastHashJoinExec |
+          _: joins.ShuffledHashJoinExec | _: joins.SortMergeJoinExec |
+          _: joins.BroadcastNestedLoopJoinExec | _: joins.CartesianProductExec =>
+        assertLogicalPlanType[Join](plan)
+
+      // Aggregates - only final (Gluten + Spark)
+      case agg: HashAggregateExecBaseTransformer if isFinalAgg(agg.aggregateExpressions) =>
+        assertLogicalPlanType[Aggregate](plan)
+      case agg: aggregate.HashAggregateExec if isFinalAgg(agg.aggregateExpressions) =>
+        assertLogicalPlanType[Aggregate](plan)
+      case agg: aggregate.ObjectHashAggregateExec if isFinalAgg(agg.aggregateExpressions) =>
+        assertLogicalPlanType[Aggregate](plan)
+      case agg: aggregate.SortAggregateExec if isFinalAgg(agg.aggregateExpressions) =>
+        assertLogicalPlanType[Aggregate](plan)
+
+      // Window
+      case _: WindowExecTransformer | _: window.WindowExec =>
+        assertLogicalPlanType[Window](plan)
+
+      // Union
+      case _: ColumnarUnionExec | _: UnionExec =>
+        assertLogicalPlanType[Union](plan)
+
+      // Sample
+      case _: SampleExec =>
+        assertLogicalPlanType[Sample](plan)
+
+      // Generate
+      case _: GenerateExecTransformerBase | _: GenerateExec =>
+        assertLogicalPlanType[Generate](plan)
+
+      // Exchange nodes should NOT have logical plan tags
+      case _: ColumnarShuffleExchangeExec | _: ColumnarBroadcastExchangeExec |
+          _: exchange.ShuffleExchangeExec | _: exchange.BroadcastExchangeExec |
+          _: ReusedExchangeExec =>
+        assert(
+          plan.getTagValue(SparkPlan.LOGICAL_PLAN_TAG).isEmpty,
+          s"${plan.getClass.getSimpleName} should not have a logical plan tag")
+
+      // Subquery exec nodes don't have logical plan tags
+      case _: SubqueryExec | _: ReusedSubqueryExec =>
+        assert(plan.getTagValue(SparkPlan.LOGICAL_PLAN_TAG).isEmpty)
+
+      // Gluten infrastructure nodes (no corresponding logical plan)
+      case _: WholeStageTransformer | _: InputIteratorTransformer | _: ColumnarInputAdapter |
+          _: VeloxResizeBatchesExec =>
+      // These are Gluten-specific wrapper nodes without logical plan links.
+
+      // Scan trees
+      case _ if isGlutenScanPlanTree(plan) =>
+        // For scan plan trees (leaf under Project/Filter), we check that the leaf node
+        // has a correct logical plan link. The intermediate Project/Filter nodes may not
+        // have tags if they were created by Gluten's rewrite rules.
+        val physicalLeaves = plan.collectLeaves()
+        assert(
+          physicalLeaves.length == 1,
+          s"Expected 1 physical leaf, got ${physicalLeaves.length}")
+
+        val leafNode = physicalLeaves.head
+        // Find the logical plan from the leaf or any ancestor with a tag
+        val logicalPlanOpt = leafNode
+          .getTagValue(SparkPlan.LOGICAL_PLAN_TAG)
+          .orElse(leafNode.getTagValue(SparkPlan.LOGICAL_PLAN_INHERITED_TAG))
+          .orElse(findLogicalPlanInTree(plan))
+
+        logicalPlanOpt.foreach {
+          lp =>
+            val logicalPlan = lp match {
+              case w: WithCTE => w.plan
+              case o => o
+            }
+            val logicalLeaves = logicalPlan.collectLeaves()
+            assert(
+              logicalLeaves.length == 1,
+              s"Expected 1 logical leaf, got ${logicalLeaves.length}")
+            physicalLeaves.head match {
+              case _: RangeExec => assert(logicalLeaves.head.isInstanceOf[Range])
+              case _: DataSourceScanExec | _: BasicScanExecTransformer =>
+                assert(logicalLeaves.head.isInstanceOf[LogicalRelation])
+              case _: InMemoryTableScanExec =>
+                assert(logicalLeaves.head.isInstanceOf[columnar.InMemoryRelation])
+              case _: LocalTableScanExec => assert(logicalLeaves.head.isInstanceOf[LocalRelation])
+              case _: ExternalRDDScanExec[_] =>
+                assert(logicalLeaves.head.isInstanceOf[ExternalRDD[_]])
+              case _: datasources.v2.BatchScanExec =>
+                assert(logicalLeaves.head.isInstanceOf[DataSourceV2Relation])
+              case _ =>
+            }
+        }
+        return
+
+      case _ =>
+    }
+
+    plan.children.foreach(checkGlutenLogicalPlanTag)
+    plan.subqueries.foreach(checkGlutenLogicalPlanTag)
+  }
+
+  @scala.annotation.tailrec
+  private def isGlutenScanPlanTree(plan: SparkPlan): Boolean = plan match {
+    case ColumnarToRowExec(i: InputAdapter) => isGlutenScanPlanTree(i.child)
+    case p: ProjectExec => isGlutenScanPlanTree(p.child)
+    case p: ProjectExecTransformer => isGlutenScanPlanTree(p.child)
+    case f: FilterExec => isGlutenScanPlanTree(f.child)
+    case f: FilterExecTransformerBase => isGlutenScanPlanTree(f.child)
+    case _: LeafExecNode => true
+    case _ => false
+  }
+
+  /** Find any node in the tree that has a LOGICAL_PLAN_TAG. */
+  private def findLogicalPlanInTree(plan: SparkPlan): Option[LogicalPlan] = {
+    plan
+      .getTagValue(SparkPlan.LOGICAL_PLAN_TAG)
+      .orElse(plan.getTagValue(SparkPlan.LOGICAL_PLAN_INHERITED_TAG))
+      .orElse(plan.children.collectFirst {
+        case child if findLogicalPlanInTree(child).isDefined => findLogicalPlanInTree(child).get
+      })
+  }
+
+  private def getGlutenLogicalPlan(node: SparkPlan): LogicalPlan = {
+    node.getTagValue(SparkPlan.LOGICAL_PLAN_TAG).getOrElse {
+      node.getTagValue(SparkPlan.LOGICAL_PLAN_INHERITED_TAG).getOrElse {
+        fail(node.getClass.getSimpleName + " does not have a logical plan link")
+      }
+    }
+  }
+
+  private def assertLogicalPlanType[T <: LogicalPlan: ClassTag](node: SparkPlan): Unit = {
+    val logicalPlan = getGlutenLogicalPlan(node)
+    val expectedCls = implicitly[ClassTag[T]].runtimeClass
+    assert(
+      expectedCls == logicalPlan.getClass,
+      s"Expected ${expectedCls.getSimpleName} but got ${logicalPlan.getClass.getSimpleName}" +
+        s" for ${node.getClass.getSimpleName}"
+    )
+  }
+}
diff --git a/gluten-ut/spark41/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala b/gluten-ut/spark41/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
index fc2d4521e7f7..46c75f9e112d 100644
--- a/gluten-ut/spark41/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
+++ b/gluten-ut/spark41/src/test/scala/org/apache/gluten/utils/velox/VeloxTestSettings.scala
@@ -701,7 +701,7 @@ class VeloxTestSettings extends BackendTestSettings {
     .exclude("root OFFSET preserves data ordering with CollectLimitExec")
     .exclude("middle OFFSET preserves data ordering with the extra sort")
   enableSuite[GlutenLocalTempViewTestSuite]
-  // TODO: 4.x enableSuite[GlutenLogicalPlanTagInSparkPlanSuite]  // RUN ABORTED
+  enableSuite[GlutenLogicalPlanTagInSparkPlanSuite]
   enableSuite[GlutenOptimizeMetadataOnlyQuerySuite]
   enableSuite[GlutenPersistedViewTestSuite]
   enableSuite[GlutenPlannerSuite]
diff --git a/gluten-ut/spark41/src/test/scala/org/apache/spark/sql/execution/GlutenLogicalPlanTagInSparkPlanSuite.scala b/gluten-ut/spark41/src/test/scala/org/apache/spark/sql/execution/GlutenLogicalPlanTagInSparkPlanSuite.scala
index 297d3b2a3428..a01c81a08fa3 100644
--- a/gluten-ut/spark41/src/test/scala/org/apache/spark/sql/execution/GlutenLogicalPlanTagInSparkPlanSuite.scala
+++ b/gluten-ut/spark41/src/test/scala/org/apache/spark/sql/execution/GlutenLogicalPlanTagInSparkPlanSuite.scala
@@ -16,8 +16,176 @@
  */
 package org.apache.spark.sql.execution
 
+import org.apache.gluten.execution._
+
 import org.apache.spark.sql.GlutenSQLTestsTrait
+import org.apache.spark.sql.catalyst.expressions.aggregate.{AggregateExpression, Complete, Final}
+import org.apache.spark.sql.catalyst.plans.logical._
+import org.apache.spark.sql.execution.columnar.InMemoryTableScanExec
+import org.apache.spark.sql.execution.datasources.LogicalRelation
+import org.apache.spark.sql.execution.datasources.v2.DataSourceV2Relation
+import org.apache.spark.sql.execution.exchange.ReusedExchangeExec
+
+import scala.reflect.ClassTag
 
 class GlutenLogicalPlanTagInSparkPlanSuite
   extends LogicalPlanTagInSparkPlanSuite
-  with GlutenSQLTestsTrait {}
+  with GlutenSQLTestsTrait {
+
+  // Override to use Gluten-aware logical plan tag checking.
+  // Gluten replaces Spark physical operators with Transformer nodes that don't match
+  // the original Spark pattern matching in LogicalPlanTagInSparkPlanSuite.
+  override protected def checkGeneratedCode(
+      plan: SparkPlan,
+      checkMethodCodeSize: Boolean = true): Unit = {
+    // Skip parent's codegen check (Gluten doesn't use WholeStageCodegen).
+    // Only run the Gluten-aware logical plan tag check.
+    checkGlutenLogicalPlanTag(plan)
+  }
+
+  private def isFinalAgg(aggExprs: Seq[AggregateExpression]): Boolean = {
+    aggExprs.nonEmpty && aggExprs.forall(ae => ae.mode == Complete || ae.mode == Final)
+  }
+
+  private def checkGlutenLogicalPlanTag(plan: SparkPlan): Unit = {
+    plan match {
+      // Joins (Gluten + Spark)
+      case _: BroadcastHashJoinExecTransformerBase | _: ShuffledHashJoinExecTransformerBase |
+          _: SortMergeJoinExecTransformerBase | _: CartesianProductExecTransformer |
+          _: BroadcastNestedLoopJoinExecTransformer | _: joins.BroadcastHashJoinExec |
+          _: joins.ShuffledHashJoinExec | _: joins.SortMergeJoinExec |
+          _: joins.BroadcastNestedLoopJoinExec | _: joins.CartesianProductExec =>
+        assertLogicalPlanType[Join](plan)
+
+      // Aggregates - only final (Gluten + Spark)
+      case agg: HashAggregateExecBaseTransformer if isFinalAgg(agg.aggregateExpressions) =>
+        assertLogicalPlanType[Aggregate](plan)
+      case agg: aggregate.HashAggregateExec if isFinalAgg(agg.aggregateExpressions) =>
+        assertLogicalPlanType[Aggregate](plan)
+      case agg: aggregate.ObjectHashAggregateExec if isFinalAgg(agg.aggregateExpressions) =>
+        assertLogicalPlanType[Aggregate](plan)
+      case agg: aggregate.SortAggregateExec if isFinalAgg(agg.aggregateExpressions) =>
+        assertLogicalPlanType[Aggregate](plan)
+
+      // Window
+      case _: WindowExecTransformer | _: window.WindowExec =>
+        assertLogicalPlanType[Window](plan)
+
+      // Union
+      case _: ColumnarUnionExec | _: UnionExec =>
+        assertLogicalPlanType[Union](plan)
+
+      // Sample
+      case _: SampleExec =>
+        assertLogicalPlanType[Sample](plan)
+
+      // Generate
+      case _: GenerateExecTransformerBase | _: GenerateExec =>
+        assertLogicalPlanType[Generate](plan)
+
+      // Exchange nodes should NOT have logical plan tags
+      case _: ColumnarShuffleExchangeExec | _: ColumnarBroadcastExchangeExec |
+          _: exchange.ShuffleExchangeExec | _: exchange.BroadcastExchangeExec |
+          _: ReusedExchangeExec =>
+        assert(
+          plan.getTagValue(SparkPlan.LOGICAL_PLAN_TAG).isEmpty,
+          s"${plan.getClass.getSimpleName} should not have a logical plan tag")
+
+      // Subquery exec nodes don't have logical plan tags
+      case _: SubqueryExec | _: ReusedSubqueryExec =>
+        assert(plan.getTagValue(SparkPlan.LOGICAL_PLAN_TAG).isEmpty)
+
+      // Gluten infrastructure nodes (no corresponding logical plan)
+      case _: WholeStageTransformer | _: InputIteratorTransformer | _: ColumnarInputAdapter |
+          _: VeloxResizeBatchesExec =>
+      // These are Gluten-specific wrapper nodes without logical plan links.
+
+      // Scan trees
+      case _ if isGlutenScanPlanTree(plan) =>
+        // For scan plan trees (leaf under Project/Filter), we check that the leaf node
+        // has a correct logical plan link. The intermediate Project/Filter nodes may not
+        // have tags if they were created by Gluten's rewrite rules.
+        val physicalLeaves = plan.collectLeaves()
+        assert(
+          physicalLeaves.length == 1,
+          s"Expected 1 physical leaf, got ${physicalLeaves.length}")
+
+        val leafNode = physicalLeaves.head
+        // Find the logical plan from the leaf or any ancestor with a tag
+        val logicalPlanOpt = leafNode
+          .getTagValue(SparkPlan.LOGICAL_PLAN_TAG)
+          .orElse(leafNode.getTagValue(SparkPlan.LOGICAL_PLAN_INHERITED_TAG))
+          .orElse(findLogicalPlanInTree(plan))
+
+        logicalPlanOpt.foreach {
+          lp =>
+            val logicalPlan = lp match {
+              case w: WithCTE => w.plan
+              case o => o
+            }
+            val logicalLeaves = logicalPlan.collectLeaves()
+            assert(
+              logicalLeaves.length == 1,
+              s"Expected 1 logical leaf, got ${logicalLeaves.length}")
+            physicalLeaves.head match {
+              case _: RangeExec => assert(logicalLeaves.head.isInstanceOf[Range])
+              case _: DataSourceScanExec | _: BasicScanExecTransformer =>
+                assert(logicalLeaves.head.isInstanceOf[LogicalRelation])
+              case _: InMemoryTableScanExec =>
+                assert(logicalLeaves.head.isInstanceOf[columnar.InMemoryRelation])
+              case _: LocalTableScanExec => assert(logicalLeaves.head.isInstanceOf[LocalRelation])
+              case _: ExternalRDDScanExec[_] =>
+                assert(logicalLeaves.head.isInstanceOf[ExternalRDD[_]])
+              case _: datasources.v2.BatchScanExec =>
+                assert(logicalLeaves.head.isInstanceOf[DataSourceV2Relation])
+              case _ =>
+            }
+        }
+        return
+
+      case _ =>
+    }
+
+    plan.children.foreach(checkGlutenLogicalPlanTag)
+    plan.subqueries.foreach(checkGlutenLogicalPlanTag)
+  }
+
+  @scala.annotation.tailrec
+  private def isGlutenScanPlanTree(plan: SparkPlan): Boolean = plan match {
+    case ColumnarToRowExec(i: InputAdapter) => isGlutenScanPlanTree(i.child)
+    case p: ProjectExec => isGlutenScanPlanTree(p.child)
+    case p: ProjectExecTransformer => isGlutenScanPlanTree(p.child)
+    case f: FilterExec => isGlutenScanPlanTree(f.child)
+    case f: FilterExecTransformerBase => isGlutenScanPlanTree(f.child)
+    case _: LeafExecNode => true
+    case _ => false
+  }
+
+  /** Find any node in the tree that has a LOGICAL_PLAN_TAG. */
+  private def findLogicalPlanInTree(plan: SparkPlan): Option[LogicalPlan] = {
+    plan
+      .getTagValue(SparkPlan.LOGICAL_PLAN_TAG)
+      .orElse(plan.getTagValue(SparkPlan.LOGICAL_PLAN_INHERITED_TAG))
+      .orElse(plan.children.collectFirst {
+        case child if findLogicalPlanInTree(child).isDefined => findLogicalPlanInTree(child).get
+      })
+  }
+
+  private def getGlutenLogicalPlan(node: SparkPlan): LogicalPlan = {
+    node.getTagValue(SparkPlan.LOGICAL_PLAN_TAG).getOrElse {
+      node.getTagValue(SparkPlan.LOGICAL_PLAN_INHERITED_TAG).getOrElse {
+        fail(node.getClass.getSimpleName + " does not have a logical plan link")
+      }
+    }
+  }
+
+  private def assertLogicalPlanType[T <: LogicalPlan: ClassTag](node: SparkPlan): Unit = {
+    val logicalPlan = getGlutenLogicalPlan(node)
+    val expectedCls = implicitly[ClassTag[T]].runtimeClass
+    assert(
+      expectedCls == logicalPlan.getClass,
+      s"Expected ${expectedCls.getSimpleName} but got ${logicalPlan.getClass.getSimpleName}" +
+        s" for ${node.getClass.getSimpleName}"
+    )
+  }
+}

From 431721f79d12b7d4d7c704288cabfc9e4a89a046 Mon Sep 17 00:00:00 2001
From: Chang chen <changchen@microsoft.com>
Date: Thu, 26 Mar 2026 10:35:07 +0000
Subject: [PATCH 12/12] Fix GlutenSparkSessionJobTaggingAndCancellationSuite
 flaky: use System.setProperty

The parent suite extends SparkFunSuite with LocalSparkContext, creating its own
SparkContext per test. Using GlutenTestsTrait creates a shared SparkSession in
beforeAll() that conflicts with per-test SparkContext creation.

Fix: Use GlutenTestsCommonTrait + System.setProperty pattern (same as
GlutenSQLExecutionSuite) so per-test SparkContexts inherit GlutenPlugin config
via system properties without session conflicts.

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
---
 ...essionJobTaggingAndCancellationSuite.scala | 21 ++++++++++++++++-
 ...essionJobTaggingAndCancellationSuite.scala | 23 ++++++++++++++++---
 2 files changed, 40 insertions(+), 4 deletions(-)

diff --git a/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/GlutenSparkSessionJobTaggingAndCancellationSuite.scala b/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/GlutenSparkSessionJobTaggingAndCancellationSuite.scala
index 8fbb53e24c17..b0b8ae6b2af2 100644
--- a/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/GlutenSparkSessionJobTaggingAndCancellationSuite.scala
+++ b/gluten-ut/spark40/src/test/scala/org/apache/spark/sql/GlutenSparkSessionJobTaggingAndCancellationSuite.scala
@@ -18,4 +18,23 @@ package org.apache.spark.sql
 
 class GlutenSparkSessionJobTaggingAndCancellationSuite
   extends SparkSessionJobTaggingAndCancellationSuite
-  with GlutenTestsTrait {}
+  with GlutenTestsCommonTrait {
+
+  override def beforeAll(): Unit = {
+    System.setProperty("spark.plugins", "org.apache.gluten.GlutenPlugin")
+    System.setProperty("spark.memory.offHeap.enabled", "true")
+    System.setProperty("spark.memory.offHeap.size", "1024MB")
+    System.setProperty(
+      "spark.shuffle.manager",
+      "org.apache.spark.shuffle.sort.ColumnarShuffleManager")
+    super.beforeAll()
+  }
+
+  override def afterAll(): Unit = {
+    super.afterAll()
+    System.clearProperty("spark.plugins")
+    System.clearProperty("spark.memory.offHeap.enabled")
+    System.clearProperty("spark.memory.offHeap.size")
+    System.clearProperty("spark.shuffle.manager")
+  }
+}
diff --git a/gluten-ut/spark41/src/test/scala/org/apache/spark/sql/GlutenSparkSessionJobTaggingAndCancellationSuite.scala b/gluten-ut/spark41/src/test/scala/org/apache/spark/sql/GlutenSparkSessionJobTaggingAndCancellationSuite.scala
index 6befbbe213c2..b0b8ae6b2af2 100644
--- a/gluten-ut/spark41/src/test/scala/org/apache/spark/sql/GlutenSparkSessionJobTaggingAndCancellationSuite.scala
+++ b/gluten-ut/spark41/src/test/scala/org/apache/spark/sql/GlutenSparkSessionJobTaggingAndCancellationSuite.scala
@@ -16,8 +16,25 @@
  */
 package org.apache.spark.sql
 
-import org.apache.spark.sql.shim.GlutenTestsTrait
-
 class GlutenSparkSessionJobTaggingAndCancellationSuite
   extends SparkSessionJobTaggingAndCancellationSuite
-  with GlutenTestsTrait {}
+  with GlutenTestsCommonTrait {
+
+  override def beforeAll(): Unit = {
+    System.setProperty("spark.plugins", "org.apache.gluten.GlutenPlugin")
+    System.setProperty("spark.memory.offHeap.enabled", "true")
+    System.setProperty("spark.memory.offHeap.size", "1024MB")
+    System.setProperty(
+      "spark.shuffle.manager",
+      "org.apache.spark.shuffle.sort.ColumnarShuffleManager")
+    super.beforeAll()
+  }
+
+  override def afterAll(): Unit = {
+    super.afterAll()
+    System.clearProperty("spark.plugins")
+    System.clearProperty("spark.memory.offHeap.enabled")
+    System.clearProperty("spark.memory.offHeap.size")
+    System.clearProperty("spark.shuffle.manager")
+  }
+}