From 062e170e94782dd492fcfc3c85a9fe0c427fac4d Mon Sep 17 00:00:00 2001
From: Adrian Garcia Badaracco <1755071+adriangb@users.noreply.github.com>
Date: Thu, 25 Dec 2025 20:44:40 -0600
Subject: [PATCH 1/3] add roundtrip tests for Unparser using clickbench / tpch

---
 datafusion/core/tests/sql/mod.rs      |   1 +
 datafusion/core/tests/sql/unparser.rs | 267 ++++++++++++++++++++++++++
 2 files changed, 268 insertions(+)
 create mode 100644 datafusion/core/tests/sql/unparser.rs
diff --git a/datafusion/core/tests/sql/mod.rs b/datafusion/core/tests/sql/mod.rs
index 3052ccf2b68f9..9a1dc5502ee60 100644
--- a/datafusion/core/tests/sql/mod.rs
+++ b/datafusion/core/tests/sql/mod.rs
@@ -70,6 +70,7 @@ mod path_partition;
 mod runtime_config;
 pub mod select;
 mod sql_api;
+mod unparser;
 
 async fn register_aggregate_csv_by_sql(ctx: &SessionContext) {
     let testdata = test_util::arrow_test_data();
diff --git a/datafusion/core/tests/sql/unparser.rs b/datafusion/core/tests/sql/unparser.rs
new file mode 100644
index 0000000000000..fe7b726475dff
--- /dev/null
+++ b/datafusion/core/tests/sql/unparser.rs
@@ -0,0 +1,267 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+//! SQL unparser tests.
+//! These are integration tests that run TPCH and ClickBench queries with and without an extra
+//! unparse -> parse step to ensure that the unparsed SQL is valid and produces the same results
+//! as the original query.
+
+use std::fs::ReadDir;
+
+use arrow::array::RecordBatch;
+use arrow_schema::Schema;
+use datafusion::common::Result;
+use datafusion::prelude::{ParquetReadOptions, SessionContext};
+use datafusion_physical_plan::ExecutionPlanProperties;
+use datafusion_sql::unparser::Unparser;
+use datafusion_sql::unparser::dialect::DefaultDialect;
+
+const BENCHMARKS_PATH_1: &str = "../../benchmarks/";
+const BENCHMARKS_PATH_2: &str = "./benchmarks/";
+
+fn iterate_queries(dir: ReadDir) -> Vec<TestQuery> {
+    let mut queries = vec![];
+    for entry in dir.flatten() {
+        let Ok(file_type) = entry.file_type() else {
+            continue;
+        };
+        if !file_type.is_file() {
+            continue;
+        }
+        let path = entry.path();
+        let Some(ext) = path.extension() else {
+            continue;
+        };
+        if ext != "sql" {
+            continue;
+        }
+        let name = path.file_stem().unwrap().to_string_lossy().to_string();
+        if let Ok(mut contents) = std::fs::read_to_string(entry.path()) {
+            // If the query contains ;\n it has DML statements like CREATE VIEW which the unparser doesn't support; skip it
+            contents = contents.trim().to_string();
+            if contents.contains(";\n") {
+                println!("Skipping query with multiple statements: {}", name);
+                continue;
+            }
+            queries.push(TestQuery {
+                sql: contents,
+                name,
+            });
+        }
+    }
+    queries
+}
+
+struct TestQuery {
+    sql: String,
+    name: String,
+}
+
+/// Collect SQL for ClickBench queries.
+fn clickbench_queries() -> Vec<TestQuery> {
+    let paths = [BENCHMARKS_PATH_1, BENCHMARKS_PATH_2];
+    let mut queries = vec![];
+    for path in paths {
+        let dir = format!("{}queries/clickbench/queries/", path);
+        println!("Reading ClickBench queries from {dir}");
+        if let Ok(dir) = std::fs::read_dir(dir) {
+            let read = iterate_queries(dir);
+            println!("Found {} ClickBench queries", read.len());
+            queries.extend(read);
+        }
+    }
+    queries.sort_unstable_by_key(|q| q.name.clone());
+    queries
+}
+
+/// Collect SQL for TPC-H queries.
+fn tpch_queries() -> Vec<TestQuery> {
+    let paths = [BENCHMARKS_PATH_1, BENCHMARKS_PATH_2];
+    let mut queries = vec![];
+    for path in paths {
+        let dir = format!("{}queries/", path);
+        println!("Reading TPC-H queries from {dir}");
+        if let Ok(dir) = std::fs::read_dir(dir) {
+            let read = iterate_queries(dir);
+            queries.extend(read);
+        }
+    }
+    println!("Total TPC-H queries found: {}", queries.len());
+    queries.sort_unstable_by_key(|q| q.name.clone());
+    queries
+}
+
+/// Create a new SessionContext for testing that has all ClickBench tables registered.
+async fn clickbench_test_context() -> Result<SessionContext> {
+    let ctx = SessionContext::new();
+    ctx.register_parquet(
+        "hits",
+        "tests/data/clickbench_hits_10.parquet",
+        ParquetReadOptions::default(),
+    )
+    .await?;
+    // Sanity check that we found the table by querying its schema; it should not be empty.
+    // Otherwise, if the path is wrong, the tests will all fail in confusing ways.
+    let df = ctx.sql("SELECT * FROM hits LIMIT 1").await?;
+    assert!(
+        !df.schema().fields().is_empty(),
+        "ClickBench 'hits' table not registered correctly"
+    );
+    Ok(ctx)
+}
+
+/// Create a new SessionContext for testing that has all TPC-H tables registered.
+async fn tpch_test_context() -> Result<SessionContext> {
+    let ctx = SessionContext::new();
+    let data_dir = "tests/data/";
+    // All tables have the pattern "tpch_<table_name>_small.parquet"
+    for table in [
+        "customer", "lineitem", "nation", "orders", "part", "partsupp", "region",
+        "supplier",
+    ] {
+        let path = format!("{data_dir}tpch_{table}_small.parquet");
+        ctx.register_parquet(table, &path, ParquetReadOptions::default())
+            .await?;
+        // Sanity check that we found the table by querying its schema; it should not be empty.
+        // Otherwise, if the path is wrong, the tests will all fail in confusing ways.
+        let df = ctx.sql(&format!("SELECT * FROM {table} LIMIT 1")).await?;
+        assert!(
+            !df.schema().fields().is_empty(),
+            "TPC-H '{table}' table not registered correctly"
+        );
+    }
+    Ok(ctx)
+}
+
+async fn sort_batches(
+    ctx: &SessionContext,
+    batches: Vec<RecordBatch>,
+    schema: &Schema,
+) -> Result<Vec<RecordBatch>> {
+    let df = ctx.read_batches(batches)?.sort(
+        schema
+            .fields()
+            .iter()
+            .map(|f| datafusion::prelude::col(f.name()).sort(true, false))
+            .collect(),
+    )?;
+    df.collect().await
+}
+
+struct UnparsedTestCaseResult {
+    original: String,
+    unparsed: String,
+    expected: Vec<RecordBatch>,
+    actual: Vec<RecordBatch>,
+}
+
+async fn collect_results(
+    ctx: &SessionContext,
+    original: &str,
+) -> Result<UnparsedTestCaseResult> {
+    let unparser = Unparser::new(&DefaultDialect {});
+    let df = ctx.sql(original).await.map_err(|e| {
+        datafusion::error::DataFusionError::Execution(format!(
+            "Error executing original SQL:\n{}\n\nError: {}",
+            original, e,
+        ))
+    })?;
+    let unparsed = format!(
+        "{:#}",
+        unparser.plan_to_sql(&df.logical_plan()).map_err(|e| {
+            datafusion::error::DataFusionError::Execution(format!(
+                "Error unparsing SQL:\n{}\n\nError: {}",
+                original, e,
+            ))
+        })?
+    );
+    let schema = df.schema().as_arrow().clone();
+    let is_sorted = ctx
+        .state()
+        .create_physical_plan(df.logical_plan())
+        .await?
+        .equivalence_properties()
+        .output_ordering()
+        .is_some();
+    let mut expected = df.collect().await?;
+    let actual_df = ctx.sql(&unparsed).await.map_err(|e| {
+        datafusion::error::DataFusionError::Execution(format!(
+            "Error executing unparsed SQL:\n{}\n\nError: {}",
+            unparsed, e,
+        ))
+    })?;
+    let actual_schema = actual_df.schema().as_arrow().clone();
+    assert_eq!(
+        schema, actual_schema,
+        "Schemas do not match between original and unparsed queries"
+    );
+    let mut actual = actual_df.collect().await.map_err(|e| {
+        datafusion::error::DataFusionError::Execution(format!(
+            "Error executing unparsed SQL.Original SQL:\n{original}\n\nUnparsed SQL:\n{unparsed}\n\nError: {e}",
+        ))
+    })?;
+    if !is_sorted {
+        expected = sort_batches(ctx, expected, &schema).await?;
+        actual = sort_batches(ctx, actual, &schema).await?;
+    }
+    Ok(UnparsedTestCaseResult {
+        original: original.to_string(),
+        unparsed: unparsed.to_string(),
+        expected,
+        actual,
+    })
+}
+
+#[tokio::test]
+async fn test_clickbench_unparser_roundtrip() -> Result<()> {
+    let queries = clickbench_queries();
+    for sql in queries {
+        let ctx = clickbench_test_context().await?;
+        println!("Testing ClickBench query: {}", sql.name);
+        let result = collect_results(&ctx, &sql.sql).await?;
+        assert_eq!(
+            result.expected, result.actual,
+            "Results do not match for ClickBench query.\nOriginal SQL:\n{}\n\nUnparsed SQL:\n{}\n",
+            result.original, result.unparsed
+        );
+    }
+    Ok(())
+}
+
+#[tokio::test]
+async fn test_tpch_unparser_roundtrip() -> Result<()> {
+    let queries = tpch_queries();
+    for sql in queries {
+        let ctx = tpch_test_context().await?;
+        let result = match collect_results(&ctx, &sql.sql).await {
+            Ok(res) => res,
+            Err(e) => {
+                println!(
+                    "Error processing TPC-H query {}: {}\nOriginal SQL:\n{}",
+                    sql.name, e, sql.sql
+                );
+                return Err(e);
+            }
+        };
+        assert_eq!(
+            result.expected, result.actual,
+            "Results do not match for TPC-H query.\nOriginal SQL:\n{}\n\nUnparsed SQL:\n{}\n",
+            result.original, result.unparsed
+        );
+    }
+    Ok(())
+}

From 3019e759676ed81ddb6f5c5d708d3e42f44a929b Mon Sep 17 00:00:00 2001
From: Adrian Garcia Badaracco <1755071+adriangb@users.noreply.github.com>
Date: Thu, 25 Dec 2025 23:20:51 -0600
Subject: [PATCH 2/3] fixed

---
 datafusion/core/tests/sql/unparser.rs     | 418 ++++++++++++++++------
 datafusion/sql/src/unparser/dialect.rs    |  11 +-
 datafusion/sql/src/unparser/plan.rs       |  10 -
 datafusion/sql/tests/cases/plan_to_sql.rs |   2 +-
 4 files changed, 315 insertions(+), 126 deletions(-)

diff --git a/datafusion/core/tests/sql/unparser.rs b/datafusion/core/tests/sql/unparser.rs
index fe7b726475dff..78507b5f9cab4 100644
--- a/datafusion/core/tests/sql/unparser.rs
+++ b/datafusion/core/tests/sql/unparser.rs
@@ -15,24 +15,54 @@
 // specific language governing permissions and limitations
 // under the License.
 
-//! SQL unparser tests.
-//! These are integration tests that run TPCH and ClickBench queries with and without an extra
-//! unparse -> parse step to ensure that the unparsed SQL is valid and produces the same results
-//! as the original query.
+//! SQL Unparser Roundtrip Integration Tests
+//!
+//! This module tests the [`Unparser`] by running queries through a complete roundtrip:
+//! the original SQL is parsed into a logical plan, unparsed back to SQL, then that
+//! generated SQL is parsed and executed. The results are compared to verify semantic
+//! equivalence.
+//!
+//! ## Test Strategy
+//!
+//! Uses real-world benchmark queries (TPC-H and Clickbench) to validate that:
+//! 1. The unparser produces syntactically valid SQL
+//! 2. The unparsed SQL is semantically equivalent (produces identical results)
+//!
+//! ## Query Suites
+//!
+//! - **TPC-H**: Standard decision-support benchmark with 22 complex analytical queries
+//! - **Clickbench**: Web analytics benchmark with 43 queries against a denormalized schema
+//!
+//! [`Unparser`]: datafusion_sql::unparser::Unparser
 
 use std::fs::ReadDir;
+use std::future::Future;
 
 use arrow::array::RecordBatch;
-use arrow_schema::Schema;
 use datafusion::common::Result;
 use datafusion::prelude::{ParquetReadOptions, SessionContext};
+use datafusion_common::Column;
+use datafusion_expr::Expr;
 use datafusion_physical_plan::ExecutionPlanProperties;
 use datafusion_sql::unparser::Unparser;
 use datafusion_sql::unparser::dialect::DefaultDialect;
+use itertools::Itertools;
 
+/// Primary path to benchmark query files (when running from repo root).
 const BENCHMARKS_PATH_1: &str = "../../benchmarks/";
+
+/// Fallback path to benchmark query files (when running from different working directories).
 const BENCHMARKS_PATH_2: &str = "./benchmarks/";
 
+/// Reads all `.sql` files from a directory and converts them to test queries.
+///
+/// Skips files that:
+/// - Are not regular files
+/// - Don't have a `.sql` extension
+/// - Contain multiple SQL statements (indicated by `;\n`)
+///
+/// Multi-statement files are skipped because the unparser doesn't support
+/// DDL statements like `CREATE VIEW` that appear in multi-statement Clickbench queries.
 fn iterate_queries(dir: ReadDir) -> Vec<TestQuery> {
     let mut queries = vec![];
     for entry in dir.flatten() {
@@ -54,7 +84,7 @@ fn iterate_queries(dir: ReadDir) -> Vec<TestQuery> {
             // If the query contains ;\n it has DML statements like CREATE VIEW which the unparser doesn't support; skip it
             contents = contents.trim().to_string();
             if contents.contains(";\n") {
-                println!("Skipping query with multiple statements: {}", name);
+                println!("Skipping query with multiple statements: {name}");
                 continue;
             }
             queries.push(TestQuery {
@@ -66,25 +96,36 @@ fn iterate_queries(dir: ReadDir) -> Vec<TestQuery> {
     queries
 }
 
+/// A SQL query loaded from a benchmark file for roundtrip testing.
+///
+/// Each query is identified by its filename (without extension) and contains
+/// the full SQL text to be tested.
 struct TestQuery {
+    /// The SQL query text to test.
     sql: String,
+    /// The query identifier (typically the filename without .sql extension).
     name: String,
 }
 
-/// Collect SQL for ClickBench queries.
+/// Collect SQL for Clickbench queries.
 fn clickbench_queries() -> Vec<TestQuery> {
     let paths = [BENCHMARKS_PATH_1, BENCHMARKS_PATH_2];
     let mut queries = vec![];
     for path in paths {
-        let dir = format!("{}queries/clickbench/queries/", path);
-        println!("Reading ClickBench queries from {dir}");
+        let dir = format!("{path}queries/clickbench/queries/");
+        println!("Reading Clickbench queries from {dir}");
         if let Ok(dir) = std::fs::read_dir(dir) {
             let read = iterate_queries(dir);
-            println!("Found {} ClickBench queries", read.len());
+            println!("Found {} Clickbench queries", read.len());
             queries.extend(read);
         }
     }
-    queries.sort_unstable_by_key(|q| q.name.clone());
+    queries.sort_unstable_by_key(|q| {
+        q.name
+            .split('q')
+            .next_back()
+            .and_then(|num| num.parse::<u32>().ok())
+    });
     queries
 }
 
@@ -93,7 +134,7 @@ fn tpch_queries() -> Vec<TestQuery> {
     let paths = [BENCHMARKS_PATH_1, BENCHMARKS_PATH_2];
     let mut queries = vec![];
     for path in paths {
-        let dir = format!("{}queries/", path);
+        let dir = format!("{path}queries/");
         println!("Reading TPC-H queries from {dir}");
         if let Ok(dir) = std::fs::read_dir(dir) {
             let read = iterate_queries(dir);
@@ -105,7 +146,7 @@ fn tpch_queries() -> Vec<TestQuery> {
     queries
 }
 
-/// Create a new SessionContext for testing that has all ClickBench tables registered.
+/// Create a new SessionContext for testing that has all Clickbench tables registered.
 async fn clickbench_test_context() -> Result<SessionContext> {
     let ctx = SessionContext::new();
     ctx.register_parquet(
@@ -119,7 +160,7 @@ async fn clickbench_test_context() -> Result<SessionContext> {
     let df = ctx.sql("SELECT * FROM hits LIMIT 1").await?;
     assert!(
         !df.schema().fields().is_empty(),
-        "ClickBench 'hits' table not registered correctly"
+        "Clickbench 'hits' table not registered correctly"
     );
     Ok(ctx)
 }
@@ -147,121 +188,280 @@ async fn tpch_test_context() -> Result<SessionContext> {
     Ok(ctx)
 }
 
+/// Sorts record batches by all columns for deterministic comparison.
+///
+/// When comparing query results, we need a canonical ordering so that
+/// semantically equivalent results compare as equal. This function sorts
+/// by all columns in the schema to achieve that.
 async fn sort_batches(
     ctx: &SessionContext,
     batches: Vec<RecordBatch>,
-    schema: &Schema,
 ) -> Result<Vec<RecordBatch>> {
-    let df = ctx.read_batches(batches)?.sort(
-        schema
-            .fields()
-            .iter()
-            .map(|f| datafusion::prelude::col(f.name()).sort(true, false))
-            .collect(),
-    )?;
+    let mut df = ctx.read_batches(batches)?;
+    let schema = df.schema().as_arrow().clone();
+    let sort_exprs = schema
+        .fields()
+        .iter()
+        // Use Column directly, col() causes the column names to be normalized to lowercase
+        .map(|f| {
+            Expr::Column(Column::new_unqualified(f.name().to_string())).sort(true, false)
+        })
+        .collect_vec();
+    if !sort_exprs.is_empty() {
+        df = df.sort(sort_exprs)?;
+    }
     df.collect().await
 }
 
-struct UnparsedTestCaseResult {
-    original: String,
-    unparsed: String,
-    expected: Vec<RecordBatch>,
-    actual: Vec<RecordBatch>,
+/// The outcome of running a single roundtrip test.
+///
+/// A successful test produces [`TestCaseResult::Success`].
+/// All other variants capture different failure modes with enough context to diagnose the issue.
+enum TestCaseResult {
+    /// The unparsed SQL produced identical results to the original.
+    Success,
+
+    /// Both queries executed but produced different results.
+    ///
+    /// This indicates a semantic bug in the unparser where the generated SQL
+    /// has different meaning than the original.
+    ResultsMismatch { original: String, unparsed: String },
+
+    /// The unparser failed to convert the logical plan to SQL.
+    ///
+    /// This may indicate an unsupported SQL feature or a bug in the unparser.
+    UnparseError { original: String, error: String },
+
+    /// The original SQL failed to execute.
+    ///
+    /// This indicates a problem with the test setup (missing tables,
+    /// invalid test data) rather than an unparser issue.
+    ExecutionError { original: String, error: String },
+
+    /// The unparsed SQL failed to execute, even though the original succeeded.
+    ///
+    /// This indicates the unparser generated syntactically invalid SQL or SQL
+    /// that references non-existent columns/tables.
+    UnparsedExecutionError {
+        original: String,
+        unparsed: String,
+        error: String,
+    },
 }
 
-async fn collect_results(
-    ctx: &SessionContext,
-    original: &str,
-) -> Result<UnparsedTestCaseResult> {
+impl TestCaseResult {
+    /// Returns true if the test case represents a failure
+    /// (anything other than [`TestCaseResult::Success`]).
+    fn is_failure(&self) -> bool {
+        !matches!(self, TestCaseResult::Success)
+    }
+
+    /// Formats a detailed error message for the test case into a string.
+    fn format_error(&self, name: &str) -> String {
+        match self {
+            TestCaseResult::Success => String::new(),
+            TestCaseResult::ResultsMismatch { original, unparsed } => {
+                format!(
+                    "Results mismatch for {name}.\nOriginal SQL:\n{original}\n\nUnparsed SQL:\n{unparsed}"
+                )
+            }
+            TestCaseResult::UnparseError { original, error } => {
+                format!("Unparse error for {name}: {error}\nOriginal SQL:\n{original}")
+            }
+            TestCaseResult::ExecutionError { original, error } => {
+                format!("Execution error for {name}: {error}\nOriginal SQL:\n{original}")
+            }
+            TestCaseResult::UnparsedExecutionError {
+                original,
+                unparsed,
+                error,
+            } => {
+                format!(
+                    "Unparsed execution error for {name}: {error}\nOriginal SQL:\n{original}\n\nUnparsed SQL:\n{unparsed}"
+                )
+            }
+        }
+    }
+}
+
+/// Executes a roundtrip test for a single SQL query.
+///
+/// This is the core test logic that:
+/// 1. Parses the original SQL and creates a logical plan
+/// 2. Unparses the logical plan back to SQL
+/// 3. Executes both the original and unparsed queries
+/// 4. Compares the results (sorting if the query has no ORDER BY)
+///
+/// This always uses [`DefaultDialect`] for unparsing.
+///
+/// # Arguments
+///
+/// * `ctx` - Session context with tables registered
+/// * `original` - The original SQL query to test
+///
+/// # Returns
+///
+/// A [`TestCaseResult`] indicating success or the specific failure mode.
+async fn collect_results(ctx: &SessionContext, original: &str) -> TestCaseResult {
     let unparser = Unparser::new(&DefaultDialect {});
-    let df = ctx.sql(original).await.map_err(|e| {
-        datafusion::error::DataFusionError::Execution(format!(
-            "Error executing original SQL:\n{}\n\nError: {}",
-            original, e,
-        ))
-    })?;
-    let unparsed = format!(
-        "{:#}",
-        unparser.plan_to_sql(&df.logical_plan()).map_err(|e| {
-            datafusion::error::DataFusionError::Execution(format!(
-                "Error unparsing SQL:\n{}\n\nError: {}",
-                original, e,
-            ))
-        })?
-    );
-    let schema = df.schema().as_arrow().clone();
-    let is_sorted = ctx
-        .state()
-        .create_physical_plan(df.logical_plan())
-        .await?
-        .equivalence_properties()
-        .output_ordering()
-        .is_some();
-    let mut expected = df.collect().await?;
-    let actual_df = ctx.sql(&unparsed).await.map_err(|e| {
-        datafusion::error::DataFusionError::Execution(format!(
-            "Error executing unparsed SQL:\n{}\n\nError: {}",
-            unparsed, e,
-        ))
-    })?;
-    let actual_schema = actual_df.schema().as_arrow().clone();
-    assert_eq!(
-        schema, actual_schema,
-        "Schemas do not match between original and unparsed queries"
-    );
-    let mut actual = actual_df.collect().await.map_err(|e| {
-        datafusion::error::DataFusionError::Execution(format!(
-            "Error executing unparsed SQL.Original SQL:\n{original}\n\nUnparsed SQL:\n{unparsed}\n\nError: {e}",
-        ))
-    })?;
+
+    // Parse and create logical plan from original SQL
+    let df = match ctx.sql(original).await {
+        Ok(df) => df,
+        Err(e) => {
+            return TestCaseResult::ExecutionError {
+                original: original.to_string(),
+                error: e.to_string(),
+            };
+        }
+    };
+
+    // Unparse the logical plan back to SQL
+    let unparsed = match unparser.plan_to_sql(df.logical_plan()) {
+        Ok(sql) => format!("{sql:#}"),
+        Err(e) => {
+            return TestCaseResult::UnparseError {
+                original: original.to_string(),
+                error: e.to_string(),
+            };
+        }
+    };
+
+    let is_sorted = match ctx.state().create_physical_plan(df.logical_plan()).await {
+        Ok(plan) => plan.equivalence_properties().output_ordering().is_some(),
+        Err(e) => {
+            return TestCaseResult::ExecutionError {
+                original: original.to_string(),
+                error: e.to_string(),
+            };
+        }
+    };
+
+    // Collect results from original query
+    let mut expected = match df.collect().await {
+        Ok(batches) => batches,
+        Err(e) => {
+            return TestCaseResult::ExecutionError {
+                original: original.to_string(),
+                error: e.to_string(),
+            };
+        }
+    };
+
+    // Parse and execute the unparsed SQL
+    let actual_df = match ctx.sql(&unparsed).await {
+        Ok(df) => df,
+        Err(e) => {
+            return TestCaseResult::UnparsedExecutionError {
+                original: original.to_string(),
+                unparsed,
+                error: e.to_string(),
+            };
+        }
+    };
+
+    // Collect results from unparsed query
+    let mut actual = match actual_df.collect().await {
+        Ok(batches) => batches,
+        Err(e) => {
+            return TestCaseResult::UnparsedExecutionError {
+                original: original.to_string(),
+                unparsed,
+                error: e.to_string(),
+            };
+        }
+    };
+
+    // Sort if needed for comparison
     if !is_sorted {
-        expected = sort_batches(ctx, expected, &schema).await?;
-        actual = sort_batches(ctx, actual, &schema).await?;
+        expected = match sort_batches(ctx, expected).await {
+            Ok(batches) => batches,
+            Err(e) => {
+                return TestCaseResult::ExecutionError {
+                    original: original.to_string(),
+                    error: format!("Failed to sort expected results: {e}"),
+                };
+            }
+        };
+        actual = match sort_batches(ctx, actual).await {
+            Ok(batches) => batches,
+            Err(e) => {
+                return TestCaseResult::UnparsedExecutionError {
+                    original: original.to_string(),
+                    unparsed,
+                    error: format!("Failed to sort actual results: {e}"),
+                };
+            }
+        };
     }
-    Ok(UnparsedTestCaseResult {
-        original: original.to_string(),
-        unparsed: unparsed.to_string(),
-        expected,
-        actual,
-    })
-}
 
-#[tokio::test]
-async fn test_clickbench_unparser_roundtrip() -> Result<()> {
-    let queries = clickbench_queries();
-    for sql in queries {
-        let ctx = clickbench_test_context().await?;
-        println!("Testing ClickBench query: {}", sql.name);
-        let result = collect_results(&ctx, &sql.sql).await?;
-        assert_eq!(
-            result.expected, result.actual,
-            "Results do not match for ClickBench query.\nOriginal SQL:\n{}\n\nUnparsed SQL:\n{}\n",
-            result.original, result.unparsed
-        );
+    if expected != actual {
+        TestCaseResult::ResultsMismatch {
+            original: original.to_string(),
+            unparsed,
+        }
+    } else {
+        TestCaseResult::Success
     }
-    Ok(())
 }
 
-#[tokio::test]
-async fn test_tpch_unparser_roundtrip() -> Result<()> {
-    let queries = tpch_queries();
+/// Runs roundtrip tests for a collection of queries and reports results.
+///
+/// Iterates through all queries, running each through [`collect_results`].
+/// Prints colored status (green checkmark for success, red X for failure)
+/// and panics at the end if any tests failed, with detailed error messages.
+///
+/// # Type Parameters
+///
+/// * `F` - Factory function that creates fresh session contexts
+/// * `Fut` - Future type returned by the context factory
+///
+/// # Panics
+///
+/// Panics if any query fails the roundtrip test, displaying all failures.
+async fn run_roundtrip_tests<F, Fut>(
+    suite_name: &str,
+    queries: Vec<TestQuery>,
+    create_context: F,
+) where
+    F: Fn() -> Fut,
+    Fut: Future<Output = Result<SessionContext>>,
+{
+    let mut errors: Vec<String> = vec![];
     for sql in queries {
-        let ctx = tpch_test_context().await?;
-        let result = match collect_results(&ctx, &sql.sql).await {
-            Ok(res) => res,
+        let ctx = match create_context().await {
+            Ok(ctx) => ctx,
             Err(e) => {
-                println!(
-                    "Error processing TPC-H query {}: {}\nOriginal SQL:\n{}",
-                    sql.name, e, sql.sql
-                );
-                return Err(e);
+                println!("\x1b[31m✗\x1b[0m {} query: {}", suite_name, sql.name);
+                errors.push(format!("Failed to create context for {}: {}", sql.name, e));
+                continue;
             }
         };
-        assert_eq!(
-            result.expected, result.actual,
-            "Results do not match for TPC-H query.\nOriginal SQL:\n{}\n\nUnparsed SQL:\n{}\n",
-            result.original, result.unparsed
+        let result = collect_results(&ctx, &sql.sql).await;
+        if result.is_failure() {
+            println!("\x1b[31m✗\x1b[0m {} query: {}", suite_name, sql.name);
+            errors.push(result.format_error(&sql.name));
+        } else {
+            println!("\x1b[32m✓\x1b[0m {} query: {}", suite_name, sql.name);
+        }
+    }
+    if !errors.is_empty() {
+        panic!(
+            "{} {} test(s) failed:\n\n{}",
+            errors.len(),
+            suite_name,
+            errors.join("\n\n---\n\n")
         );
     }
-    Ok(())
+}
+
+#[tokio::test]
+async fn test_clickbench_unparser_roundtrip() {
+    run_roundtrip_tests("Clickbench", clickbench_queries(), clickbench_test_context)
+        .await;
+}
+
+#[tokio::test]
+async fn test_tpch_unparser_roundtrip() {
+    run_roundtrip_tests("TPC-H", tpch_queries(), tpch_test_context).await;
 }
diff --git a/datafusion/sql/src/unparser/dialect.rs b/datafusion/sql/src/unparser/dialect.rs
index 844fa6febcfe9..1a3e1a06db5f1 100644
--- a/datafusion/sql/src/unparser/dialect.rs
+++ b/datafusion/sql/src/unparser/dialect.rs
@@ -298,13 +298,12 @@ impl Dialect for DefaultDialect {
         let id_upper = identifier.to_uppercase();
         // Special case ignore "ID", see https://github.com/sqlparser-rs/sqlparser-rs/issues/1382
         // ID is a keyword in ClickHouse, but we don't want to quote it when unparsing SQL here
-        if (id_upper != "ID" && ALL_KEYWORDS.contains(&id_upper.as_str()))
+        // Also quote identifiers with uppercase letters since unquoted identifiers are
+        // normalized to lowercase by the SQL parser, which would break case-sensitive schemas
+        let needs_quote = (id_upper != "ID" && ALL_KEYWORDS.contains(&id_upper.as_str()))
             || !identifier_regex.is_match(identifier)
-        {
-            Some('"')
-        } else {
-            None
-        }
+            || identifier.chars().any(|c| c.is_ascii_uppercase());
+        if needs_quote { Some('"') } else { None }
     }
 }
 
diff --git a/datafusion/sql/src/unparser/plan.rs b/datafusion/sql/src/unparser/plan.rs
index d56ecb4f1560d..56bf887dbde43 100644
--- a/datafusion/sql/src/unparser/plan.rs
+++ b/datafusion/sql/src/unparser/plan.rs
@@ -499,16 +499,6 @@ impl Unparser<'_> {
                 )
             }
             LogicalPlan::Sort(sort) => {
-                // Sort can be top-level plan for derived table
-                if select.already_projected() {
-                    return self.derive_with_dialect_alias(
-                        "derived_sort",
-                        plan,
-                        relation,
-                        false,
-                        vec![],
-                    );
-                }
                 let Some(query_ref) = query else {
                     return internal_err!(
                         "Sort operator only valid in a statement context."
diff --git a/datafusion/sql/tests/cases/plan_to_sql.rs b/datafusion/sql/tests/cases/plan_to_sql.rs
index 27f4e2cd551cb..46a42ae534af0 100644
--- a/datafusion/sql/tests/cases/plan_to_sql.rs
+++ b/datafusion/sql/tests/cases/plan_to_sql.rs
@@ -1984,7 +1984,7 @@ fn test_complex_order_by_with_grouping() -> Result<()> {
     }, {
         assert_snapshot!(
             sql,
-            @"SELECT j1.j1_id, j1.j1_string, lochierarchy FROM (SELECT j1.j1_id, j1.j1_string, (grouping(j1.j1_id) + grouping(j1.j1_string)) AS lochierarchy, grouping(j1.j1_string), grouping(j1.j1_id) FROM j1 GROUP BY ROLLUP (j1.j1_id, j1.j1_string) ORDER BY lochierarchy DESC NULLS FIRST, CASE WHEN ((grouping(j1.j1_id) + grouping(j1.j1_string)) = 0) THEN j1.j1_id END ASC NULLS LAST) LIMIT 100"
+            @r#"SELECT j1.j1_id, j1.j1_string, lochierarchy FROM (SELECT j1.j1_id, j1.j1_string, (grouping(j1.j1_id) + grouping(j1.j1_string)) AS lochierarchy, grouping(j1.j1_string), grouping(j1.j1_id) FROM j1 GROUP BY ROLLUP (j1.j1_id, j1.j1_string)) ORDER BY lochierarchy DESC NULLS FIRST, CASE WHEN (("grouping(j1.j1_id)" + "grouping(j1.j1_string)") = 0) THEN j1.j1_id END ASC NULLS LAST LIMIT 100"#
         );
     });
 

From 4d6b179a5364d3a87b04ea52c49cf4a2781f5438 Mon Sep 17 00:00:00 2001
From: Adrian Garcia Badaracco <1755071+adriangb@users.noreply.github.com>
Date: Sun, 28 Dec 2025 13:45:42 -0600
Subject: [PATCH 3/3] consolidate benchmark paths

---
 datafusion/core/tests/sql/unparser.rs | 13 ++++---------
 1 file changed, 4 insertions(+), 9 deletions(-)

diff --git a/datafusion/core/tests/sql/unparser.rs b/datafusion/core/tests/sql/unparser.rs
index 78507b5f9cab4..8b56bf67a261c 100644
--- a/datafusion/core/tests/sql/unparser.rs
+++ b/datafusion/core/tests/sql/unparser.rs
@@ -48,11 +48,8 @@ use datafusion_sql::unparser::Unparser;
 use datafusion_sql::unparser::dialect::DefaultDialect;
 use itertools::Itertools;
 
-/// Primary path to benchmark query files (when running from repo root).
-const BENCHMARKS_PATH_1: &str = "../../benchmarks/";
-
-/// Fallback path to benchmark query files (when running from different working directories).
-const BENCHMARKS_PATH_2: &str = "./benchmarks/";
+/// Candidate locations of the benchmark query files: relative to the crate directory (`datafusion/core`) and relative to the repo root.
+const BENCHMARK_PATHS: &[&str] = &["../../benchmarks/", "./benchmarks/"];
 
 /// Reads all `.sql` files from a directory and converts them to test queries.
 ///
@@ -109,9 +106,8 @@ struct TestQuery {
 
 /// Collect SQL for Clickbench queries.
 fn clickbench_queries() -> Vec<TestQuery> {
-    let paths = [BENCHMARKS_PATH_1, BENCHMARKS_PATH_2];
     let mut queries = vec![];
-    for path in paths {
+    for path in BENCHMARK_PATHS {
         let dir = format!("{path}queries/clickbench/queries/");
         println!("Reading Clickbench queries from {dir}");
         if let Ok(dir) = std::fs::read_dir(dir) {
@@ -131,9 +127,8 @@ fn clickbench_queries() -> Vec<TestQuery> {
 
 /// Collect SQL for TPC-H queries.
 fn tpch_queries() -> Vec<TestQuery> {
-    let paths = [BENCHMARKS_PATH_1, BENCHMARKS_PATH_2];
     let mut queries = vec![];
-    for path in paths {
+    for path in BENCHMARK_PATHS {
         let dir = format!("{path}queries/");
         println!("Reading TPC-H queries from {dir}");
         if let Ok(dir) = std::fs::read_dir(dir) {