diff --git a/.github/workflows/extended.yml b/.github/workflows/extended.yml
index e9eb27dd96527..9768d475c9e8c 100644
--- a/.github/workflows/extended.yml
+++ b/.github/workflows/extended.yml
@@ -66,9 +66,10 @@ jobs:
   # Check crate compiles and base cargo check passes
   linux-build-lib:
     name: linux build test
-    runs-on: ubuntu-latest
+    runs-on: ${{ github.repository_owner == 'apache' && format('runs-on={0},family=m8a,cpu=8,image=ubuntu24-full-x64,extras=s3-cache,disk=large,tag=datafusion', github.run_id) || 'ubuntu-latest' }}
     # note: do not use amd/rust container to preserve disk space
     steps:
+      - uses: runs-on/action@cd2b598b0515d39d78c38a02d529db87d2196d1e  # v2.0.3
       - uses: actions/checkout@de0fac2e4500dabe0009e67214ff5f5447ce83dd  # v6.0.2
         with:
           ref: ${{ github.event.inputs.pr_head_sha }} # will be empty if triggered by push
@@ -80,7 +81,9 @@ jobs:
           source $HOME/.cargo/env
           rustup toolchain install
       - name: Install Protobuf Compiler
-        run: sudo apt-get install -y protobuf-compiler
+        run: |
+          sudo apt-get update
+          sudo apt-get install -y protobuf-compiler
       - name: Prepare cargo build
         run: |
           cargo check --profile ci --all-targets
@@ -90,9 +93,11 @@ jobs:
   linux-test-extended:
     name: cargo test 'extended_tests' (amd64)
     needs: [linux-build-lib]
-    runs-on: ubuntu-latest
+    runs-on: ${{ github.repository_owner == 'apache' && format('runs-on={0},family=m8a,cpu=32,image=ubuntu24-full-x64,extras=s3-cache,disk=large,tag=datafusion,spot=false', github.run_id) || 'ubuntu-latest' }}
+    # spot=false because the tests are long, https://runs-on.com/configuration/spot-instances/#disable-spot-pricing
     # note: do not use amd/rust container to preserve disk space
     steps:
+      - uses: runs-on/action@cd2b598b0515d39d78c38a02d529db87d2196d1e  # v2.0.3
       - uses: actions/checkout@de0fac2e4500dabe0009e67214ff5f5447ce83dd  # v6.0.2
         with:
           ref: ${{ github.event.inputs.pr_head_sha }} # will be empty if triggered by push
@@ -106,7 +111,9 @@ jobs:
           source $HOME/.cargo/env
           rustup toolchain install
       - name: Install Protobuf Compiler
-        run: sudo apt-get install -y protobuf-compiler
+        run: |
+          sudo apt-get update
+          sudo apt-get install -y protobuf-compiler
       # For debugging, test binaries can be large.
       - name: Show available disk space
         run: |
@@ -133,10 +140,11 @@ jobs:
   # Check answers are correct when hash values collide
   hash-collisions:
     name: cargo test hash collisions (amd64)
-    runs-on: ubuntu-latest
+    runs-on: ${{ github.repository_owner == 'apache' && format('runs-on={0},family=m8a,cpu=16,image=ubuntu24-full-x64,extras=s3-cache,disk=large,tag=datafusion', github.run_id) || 'ubuntu-latest' }}
     container:
       image: amd64/rust
     steps:
+      - uses: runs-on/action@cd2b598b0515d39d78c38a02d529db87d2196d1e  # v2.0.3
       - uses: actions/checkout@de0fac2e4500dabe0009e67214ff5f5447ce83dd  # v6.0.2
         with:
           ref: ${{ github.event.inputs.pr_head_sha }} # will be empty if triggered by push
@@ -154,10 +162,12 @@ jobs:
 
   sqllogictest-sqlite:
     name: "Run sqllogictests with the sqlite test suite"
-    runs-on: ubuntu-latest
+    runs-on: ${{ github.repository_owner == 'apache' && format('runs-on={0},family=m8a,cpu=48,image=ubuntu24-full-x64,extras=s3-cache,disk=large,tag=datafusion,spot=false', github.run_id) || 'ubuntu-latest' }}
+    # spot=false because the tests are long, https://runs-on.com/configuration/spot-instances/#disable-spot-pricing
     container:
       image: amd64/rust
     steps:
+      - uses: runs-on/action@cd2b598b0515d39d78c38a02d529db87d2196d1e  # v2.0.3
       - uses: actions/checkout@de0fac2e4500dabe0009e67214ff5f5447ce83dd  # v6.0.2
         with:
           ref: ${{ github.event.inputs.pr_head_sha }} # will be empty if triggered by push
diff --git a/AGENTS.md b/AGENTS.md
new file mode 100644
index 0000000000000..168f04832aa81
--- /dev/null
+++ b/AGENTS.md
@@ -0,0 +1,376 @@
+# Repository Guidelines for Codex Agents
+
+This repository uses Rust and contains documentation in Markdown and TOML configuration files. Our focus is on delivering robust, maintainable, and high-quality solutions. Please follow these guidelines when contributing.
+
+---
+
+## Toolchain & Workspace Notes
+
+* The workspace pins the Rust toolchain to `1.90.0` via `rust-toolchain.toml` while declaring an MSRV of `1.87.0` in `Cargo.toml`. Use `rustup override set 1.90.0` if you are not already using the bundled toolchain.
+* DataFusion is organised as a large Cargo workspace. Key crates and directories include:
+
+  * `datafusion/core`, `datafusion/execution`, and `datafusion/sql` for the core logical planning, runtime configuration, and SQL planning layers.
+  * `datafusion/optimizer`, `datafusion/physical-optimizer`, `datafusion/pruning`, and `datafusion/physical-plan` for logical/physical rewrite rules, partition pruning, execution plans, and operator implementations (including the metrics subsystem under `physical-plan/src/metrics`).
+  * `datafusion/common`, `datafusion/common-runtime`, and `datafusion/macros` for shared types, error handling, async helpers (`JoinSet`, `SpawnedTask`), tracing hooks, and macro utilities.
+  * `datafusion/catalog` plus `datafusion/catalog-listing` for catalog APIs and listing-table helpers.
+  * `datafusion/datasource` and the `datafusion/datasource-*` crates for shared datasource utilities and connectors (Avro, CSV, JSON, Parquet).
+  * `datafusion/physical-expr`, `datafusion/physical-expr-common`, and `datafusion/physical-expr-adapter` for physical expression evaluation, property tracking, and schema rewriting.
+  * `datafusion/functions-*` crates covering scalar, aggregate, window, nested, and table functions together with shared utilities.
+  * `datafusion/proto`, `datafusion/proto-common`, and `datafusion/substrait` for protocol buffers, Flight SQL/CLI integration, and Substrait representations, alongside `datafusion/doc` for developer-focused documentation builds.
+  * `datafusion-cli`, `datafusion-examples`, `benchmarks`, and `test-utils` for the CLI binary, runnable examples, benchmarking harnesses, and reusable test helpers.
+
+## 1. Solution-First Approach
+
+* **Understand the Problem:** Before writing code, ensure you clearly understand the requirements and desired outcomes. Ask clarifying questions if anything is ambiguous.
+* **Design Thoughtfully:** Sketch out the architecture or data flow. Consider performance, scalability, and readability.
+* **Provide Examples:** Include usage examples or code snippets demonstrating how your feature or fix works.
+
+## 2. Code Quality & Best Practices
+
+### Idiomatic Rust
+
+* Prefer `snake_case` for variables, functions, and modules; `CamelCase` for types and enums.
+* Use pattern matching, `Option<T>`, and `Result<T, E>` for clear and safe handling of optionality and errors.
+* **Think of `Option` as a computation pipeline, not just "value or no value."** Stop treating `Option` merely as presence/absence—view it as a lazy transformation stream. Combinators like `.map()`, `.and_then()`, `.filter()`, and `.ok_or()` turn error-handling into declarative data flow. Once you internalize absence as a first-class transformation, you can write entire algorithms that never mention control flow explicitly—yet remain 100% safe and compiler-analyzable. This paradigm shift transforms imperative conditionals into composable, chainable operations.
+* Leverage iterators and functional constructs for concise, efficient code.
+* **Refactor imperative traversals** (e.g. using `.apply()` with mutable flags) **into declarative expressions** (e.g. using `.exists()`, `.any()`, or `.find()`) wherever possible. This makes the intent clearer, eliminates boilerplate, and improves maintainability.
+
+  > ✅ *Example:* Convert verbose recursion with `mut` flags into `.exists()` + `.unwrap()` patterns for simple boolean checks.
+* **Simplify match arms by directly binding variables** (e.g. `LogicalPlan::Foo(x)` instead of `LogicalPlan::Foo(_)` + `if let`). This reduces redundant re-matching and enhances clarity.
+
+  > ✅ *Example:* Collapse a redundant `if let` on a known variant by binding it directly in the `match` arm.
+  > Also take the opportunity to **clarify comments or add TODOs**, especially around complex control flows like CTEs or plan rewriting.
+
+#### Ergonomic function signatures (use `Into` / `AsRef` / `IntoIterator`)
+
+When writing or refactoring functions—especially builder setters and public APIs—prefer signatures that are ergonomic for callers while preserving performance and clarity.
+
+Use these patterns deliberately:
+
+* **Own a value:** accept `impl Into<T>` and convert internally (e.g. `host: impl Into<String>`, `path: impl Into<PathBuf>`).
+* This lets callers pass `String`/`&str`, `PathBuf`/`&Path`, etc., without manual `.to_string()` / `.into()`.
+* **Borrow read-only inputs:** accept `impl AsRef<str>` / `impl AsRef<Path>` when you do not need ownership to avoid allocations.
+* **Optional inputs:** accept `impl Into<Option<T>>` for ergonomic option-like parameters (`x`, `Some(x)`, or `None`).
+* **Collections / iterables:** accept `impl IntoIterator<Item = T>` (or `Item = impl Into<T>` when appropriate) to support `Vec`, sets, arrays, and iterators.
+
+Guidance:
+* Prefer `AsRef` for hot paths where allocation would be wasteful; prefer `Into` when the function stores/owns the value.
+* Do not use generic conversion bounds when they reduce clarity or introduce ambiguity—favor explicit types where precision matters.
+
+### Rust mental models — think in types and proofs
+
+The following mental models help write safer, clearer, and more idiomatic Rust. These are conceptual shifts — small syntax changes but large design wins.
+
+- 🔥 Ownership → Compile-Time Resource Graph
+
+  > Stop seeing ownership as “who frees memory.”
+  > See it as a **compile-time dataflow graph of resource control**.
+
+  Every `let`, `move`, or `borrow` defines an edge in a graph the compiler statically verifies — ensuring linear usage of scarce resources (files, sockets, locks) **without a runtime GC**. Once you see lifetimes as edges, not annotations, you’re designing **proofs of safety**, not code that merely compiles.
+
+---
+
+- ⚙️ Borrowing → Capability Leasing
+
+  > Stop thinking of borrowing as “taking a reference.”
+  > It’s **temporary permission to mutate or observe**, granted by the compiler’s capability system.
+
+  `&mut` isn’t a pointer — it’s a **lease with exclusive rights**, enforced at compile time. Expert code treats borrows as contracts:
+
+  * If you can shorten them, you increase parallelism.
+  * If you lengthen them, you increase safety scope.
+
+---
+
+- 🧩 Traits → Behavioral Algebra
+
+  > Stop viewing traits as “interfaces.”
+  > They’re **algebraic building blocks** that define composable laws of behavior.
+
+  A `Trait` isn’t just a promise of methods; it’s a **contract that can be combined, derived, or blanket-implemented**. Once you realize traits form a behavioral lattice, you stop subclassing and start composing — expressing polymorphism as **capabilities, not hierarchies**.
+
+---
+
+- 🧠 `Result` → Explicit Control Flow as Data
+
+  > Stop using `Result` as an error type.
+  > It’s **control flow reified as data**.
+
+  The `?` operator turns sequential logic into a **monadic pipeline** — your `Result` chain isn’t linear code; it’s a dependency graph of partial successes. Experts design their APIs so every recoverable branch is an **encoded decision**, not a runtime exception.
+
+---
+
+- 💎 Lifetimes → Static Borrow Slices
+
+  > Stop fearing lifetimes as compiler noise.
+  > They’re **proofs of local consistency** — mini type-level theorems.
+
+  Each `'a` parameter expresses that two pieces of data **coexist safely** within a bounded region of time. Experts deliberately model relationships through lifetime parameters to **eliminate entire classes of runtime checks**.
+
+---
+
+- 🪶 Pattern Matching → Declarative Exhaustiveness
+
+  > Stop thinking of `match` as a fancy switch.
+  > It’s a **total function over variants**, verified at compile time.
+
+  Once you realize `match` isn’t branching but **structural enumeration**, you start writing exhaustive domain models where every possible state is named, and every transition is **type-checked**.
+
+### Maintainability
+
+* Keep functions focused (ideally under 40 lines) and modules cohesive.
+* Name functions and variables descriptively; avoid generic names like `foo` or `temp`.
+* Group related types and functions and document public APIs with `///` comments and examples.
+
+### API Design Principles
+
+When designing structs that carry arguments or configuration (e.g., `AccumulatorArgs`, `PartitionEvaluatorArgs`, `ScalarFunctionArgs`), follow these principles:
+
+#### 1. **Clarity and Simplicity Over Cleverness**
+
+Make contracts explicit. Prefer straightforward data fields over conditional logic, runtime synthesis, or smart defaults that require deep understanding to use correctly.
+
+* ✅ **Good:** `pub input_fields: &'a [FieldRef]` — explicitly provides pre-computed field information
+* ❌ **Avoid:** Synthesizing data on-demand based on whether other fields are empty, forcing users to understand complex fallback logic
+
+**Why:** Users should not need to understand `Cow` semantics, conditional schema synthesis, or when to use `schema.field()` vs helper methods. Self-documenting APIs reduce cognitive load and onboarding time.
+
+#### 2. **Consistency with the Ecosystem**
+
+Align new APIs with existing patterns in the codebase. If scalar and window functions receive pre-evaluated `FieldRef`s, aggregate functions should follow a similar model wherever feasible.
+
+* ✅ **Good:** Provide `input_fields: &[FieldRef]` alongside `exprs: &[Arc<dyn PhysicalExpr>]` to match the ergonomics of `ScalarFunctionArgs` and `PartitionEvaluatorArgs`
+* ❌ **Avoid:** Forcing aggregate UDAFs to call `exprs[i].return_field(schema)?` when other function types receive fields directly
+
+**Why:** Consistency reduces the mental context switch when moving between different parts of the codebase. Developers familiar with one function type can transfer that knowledge directly.
+
+#### 3. **Optimize for Performance Through Pre-Computation**
+
+Pre-compute expensive or frequently accessed information during construction rather than on every access or method call.
+
+* ✅ **Good:** Compute `input_fields` once when building `AggregateFunctionExpr` and store them
+* ❌ **Avoid:** Synthesizing schemas or calling `return_field()` multiple times across `create_accumulator()`, `groups_accumulator_supported()`, `create_groups_accumulator()`, etc.
+
+**Why:** Aggregate expressions are constructed once but may create many accumulators (one per group in hash aggregations). Pre-computation amortizes costs and eliminates redundant work.
+
+#### 4. **Mechanical Changes Beat Conditional Logic**
+
+When faced with a choice between:
+- (A) Adding a field to a struct and updating all call sites mechanically
+- (B) Adding conditional logic that synthesizes or computes values at runtime
+
+Choose (A). Mechanical changes are easier to review, verify, and maintain.
+
+* ✅ **Good:** Add `input_fields` field, update 18 call sites with straightforward additions
+* ❌ **Avoid:** Adding `args_schema()` method with `Cow<Schema>` that conditionally synthesizes based on whether the schema is empty
+
+**Why:** Conditional logic introduces edge cases and potential bugs. Mechanical changes can be reviewed quickly and validated with simple grep/IDE searches. The compiler enforces that all call sites are updated.
+
+#### 5. **Future-Proofing Through Explicit Structure**
+
+Design data structures that can accommodate future features without breaking changes.
+
+* ✅ **Good:** Having explicit `input_fields` makes it easy to add per-field caching, lazy evaluation, or metadata decorators
+* ❌ **Avoid:** Tightly coupling field access to schema lookup patterns that make future optimizations require API redesign
+
+**Why:** Explicit fields provide clear extension points. Adding features like "cache field metadata" or "lazily compute field nullability" becomes straightforward without changing the public API.
+
+#### 6. **Self-Documenting APIs Over Extensive Documentation**
+
+If your API requires 80+ lines of documentation to explain when and why fields behave differently in different contexts, consider redesigning the API.
+
+* ✅ **Good:** `input_fields` is self-documenting — it contains the fields corresponding to input expressions
+* ❌ **Avoid:** Requiring users to understand: "when schema is empty we synthesize from literals, but when non-empty we use it directly, and you can use either `schema.field()` or `input_field()` depending on..."
+
+**Why:** Documentation gets outdated, misread, or overlooked. Self-documenting APIs encode contracts in types that the compiler verifies.
+
+#### Summary Checklist for Argument Structs
+
+When adding or modifying argument structs like `AccumulatorArgs`:
+
+- [ ] Are all frequently accessed fields pre-computed during construction?
+- [ ] Is the API consistent with similar structs (`ScalarFunctionArgs`, `PartitionEvaluatorArgs`)?
+- [ ] Can users access what they need without calling helper methods or understanding conditional logic?
+- [ ] Would the API be clear to someone seeing it for the first time?
+- [ ] Does adding this field require mostly mechanical changes to call sites?
+- [ ] Will this structure accommodate future features without breaking changes?
+
+### Use `take_function_args` when possible
+
+When implementing or refactoring function/aggregate/window argument handling, look for opportunities to replace manual argument-count checks and iterator extraction with the helper `take_function_args`. This reduces boilerplate and makes the code clearer and less error-prone.
+
+Example: replace this pattern
+
+  -        if args.len() != 3 {
+  -            return plan_err!("nvl2 must have exactly three arguments");
+  -        }
+  -
+  -        let mut args = args.into_iter();
+  -        let test = args.next().unwrap();
+  -        let if_non_null = args.next().unwrap();
+  -        let if_null = args.next().unwrap();
+
+with the concise and safer form
+
+  +        let [test, if_non_null, if_null] = take_function_args(self.name(), args)?;
+
+`take_function_args` validates the argument count and returns a fixed-size array for pattern matching. Use it when the arity is known at compile time.
+
+If you answer "no" to multiple questions, consider simplifying the design.
+
+### Error Handling & Context
+
+* Use the `?` operator to propagate errors with context. Avoid silent failures.
+* Implement custom errors via the `thiserror` crate when appropriate.
+* Provide clear messages to aid debugging and user feedback.
+
+### Performance Considerations
+
+* Favor zero-copy patterns: use `&str` over `String` and `Arc<T>` for shared data.
+* Avoid unnecessary heap allocations; minimize cloning.
+* Benchmark critical paths when performance is a concern.
+* Optimizations should be focused on bottlenecks — those steps that are repeated millions of times in a query; otherwise, prefer simplicity.
+
+* Prefer multiple simple code paths over a single complex adaptive path. Optimize for the common case first and keep that path fast and easy to reason about; handle rare or complex edge cases with separate, well-tested branches or fallbacks. This often yields clearer, faster, and more maintainable code than trying to build one highly adaptive, catch-all implementation.
+
+### Benchmark Pattern
+
+When creating or modifying benchmarks in `benchmarks/`, follow this standard pattern:
+
+- **Setup phase (outside loop):** Create a `SessionContext` once per case using `create_context(...) -> Result<SessionContext>`. This builds the plan once and is excluded from timing.
+- **Benchmark loop (timed):** Inside the bench loop, run:
+  - `ctx.sql(...)` — parse SQL and create logical plan
+  - `df.create_physical_plan()` — convert to physical plan
+  - `collect(plan, ctx.task_ctx())` — execute and collect results
+
+The benchmark timing includes **execution**, but the setup phase (context creation and initial planning) happens only once **outside the loop** to measure execution performance accurately.
+
+### Clone & Copy: Precision over Reflex
+
+* **Treat `Clone` as a precision instrument, not a reflex.** Implement custom `Clone` to achieve amortized O(1) behavior where possible — clone only references or indices, not deep data structures, then perform explicit duplication at controlled boundaries.
+* **Reserve `Copy` for plain-old-data only.** Restrict `Copy` to types where move and copy are semantically and computationally indistinguishable: integers, coordinates, short fixed-size math vectors, and similar primitives.
+* **Make ownership boundaries visible.** For everything else, use intentional `Clone` APIs so that duplication shows up clearly in code reviews and profiling. Explicit `.clone()` calls document where data is being duplicated and help identify optimization opportunities.
+* **Design for shared ownership.** Prefer `Arc<T>` and reference-counted patterns over deep cloning when multiple owners need access to the same data. Clone the `Arc`, not the underlying data.
+
+## 3. Testing & Validation
+
+* **Unit Tests:** Cover individual functions and edge cases with `cargo test`. Prefer `cargo test --workspace` when your change crosses crate boundaries, or target specific packages with `-p <crate>` for focused runs.
+* **Integration Tests:** Validate end-to-end behavior, especially for CLI commands or key modules.
+* **Continuous Testing:** Ensure tests run reliably in CI. Use `cargo nextest run --workspace` for faster, parallel execution when configured.
+* **Minimize Test Binaries:** Each test binary requires additional build time and disk space. Consolidate related tests into fewer test files rather than creating many small test binaries. Use `#[cfg(test)]` modules within `src/` files for unit tests, and reserve `tests/` directories for true integration tests that require a separate binary. Group logically related integration tests into shared test files with multiple `#[test]` functions.
+
+* **Prefer SQL Logic Tests (SLT) over snapshots:** For new SQL/engine tests prefer adding SQL Logic Tests (SLT) under `datafusion/sqllogictest/test_files/` instead of creating or relying on snapshot (.snap) files. SLT files are easier to review, maintain, and update. If a snapshot file is absolutely necessary, include a brief justification 
+
+## 4. Documentation & Examples
+
+* Provide clear README updates for new features or changes.
+* Include practical examples in code comments and the `examples/` directory.
+* Update CLI help strings and guides to reflect enhancements.
+
+## 5. Collaboration & Review
+
+* **Pull Requests:** Provide a concise summary of changes, motivation, and how to test.
+* **Code Reviews:** Offer constructive feedback focusing on clarity, correctness, and design.
+* **Discussions:** Use issues to propose major changes or ask design questions.
+
+## 6. Optional Tooling Checks
+
+While linting, formatting, and spelling are important, they should not overshadow solution quality. Please run formatting, linting, and `typos` **after** finalizing your code when applicable:
+
+```bash
+# Optional but recommended:
+./dev/rust_lint.sh    # Formats, lints, and checks docs
+./pre-commit.sh       # Runs clippy and fmt for staged Rust files
+prettier -w <path/to/file.md>  # Formats Markdown
+taplo format --check  # Validates TOML
+typos                 # Checks for spelling mistakes
+```
+
+Ensure these checks pass before merging (run `typos` when applicable), but prioritize delivering clear, well-designed code. `./dev/rust_lint.sh` bootstraps `taplo` automatically if it is missing so that formatting checks match CI.
+
+## Useful Helper Functions
+
+Below are helper modules and functions that simplify common tasks across the codebase:
+
+* `datafusion/common/src/utils/string_utils.rs`
+
+  * `string_array_to_vec` converts Arrow string arrays into `Vec<Option<&str>>` for easier Rust processing.
+* `datafusion/common/src/hash_utils.rs`
+
+  * `combine_hashes` merges two `u64` values and backs hash-related utilities for arrays.
+* `datafusion/common/src/test_util.rs`
+
+  * `format_batches` pretty-prints `RecordBatch` collections.
+  * Macros such as `assert_batches_eq`, `assert_batches_sorted_eq`, `assert_contains`, and `assert_not_contains` aid concise test assertions.
+* `datafusion/expr/src/utils.rs`
+
+  * `grouping_set_expr_count` counts unique grouping expressions, accounting for `GROUPING SETS`.
+  * `merge_grouping_set` joins two grouping sets while enforcing size limits.
+  * `cross_join_grouping_sets` builds the Cartesian product of grouping-set combinations.
+* `datafusion/physical-optimizer/src/utils.rs`
+
+  * `add_sort_above` and `add_sort_above_with_check` inject sorting into physical plans.
+  * Helper predicates like `is_sort`, `is_window`, `is_union`, `is_sort_preserving_merge`, `is_coalesce_partitions`, `is_repartition`, and `is_limit` classify execution plan nodes.
+* `datafusion/physical-expr-common/src/utils.rs`
+
+  * `ExprPropertiesNode::new_unknown` initializes property tracking with unknown order and range for expression trees.
+  * `scatter` performs mask-driven array scatter, filling nulls where the mask is false.
+* `datafusion/functions-window/src/utils.rs`
+
+  * `get_signed_integer`, `get_scalar_value_from_args`, and `get_unsigned_integer` handle window-function argument extraction.
+* `datafusion/functions-aggregate-common/src/utils.rs`
+
+  * `get_accum_scalar_values_as_arrays`, `ordering_fields`, and `get_sort_options` support aggregate computation internals, while helpers such as `DecimalAverager` and `Hashable<T>` keep decimal results precise and floating-point hashes stable.
+* `datafusion/sqllogictest/src/util.rs`
+
+  * Utilities like `setup_scratch_dir`, `value_normalizer`, `read_dir_recursive`, `df_value_validator`, and `is_spark_path` assist SQLLogicTest harnesses.
+* `datafusion-cli/src/helper.rs`
+
+  * `CliHelper` offers interactive SQL parsing, dialect switching, and the `split_from_semicolon` helper for multi-statement inputs.
+* `datafusion/functions/src/utils.rs`
+
+  * `make_scalar_function` wraps array-based logic for scalars and arrays, while macros like `utf8_to_str_type` and `utf8_to_int_type` derive optimal return types.
+* `datafusion/functions-nested/src/utils.rs`
+
+  * `check_datatypes` verifies all array arguments share compatible types, returning an error otherwise.
+  * `make_scalar_function` adapts array-oriented closures to work with `ColumnarValue` inputs and preserves scalar outputs when possible.
+  * `align_array_dimensions` pads nested list arrays so every argument reaches the same number of dimensions.
+* `datafusion/functions-window-common/src/partition.rs`
+
+  * `PartitionEvaluatorArgs` bundles window function arguments, fields, reversal flags, and `IGNORE NULLS` handling for custom evaluators.
+* `datafusion/optimizer/src/utils.rs`
+
+  * Utilities such as `has_all_column_refs`, `replace_qualified_name`, `is_restrict_null_predicate`, and `evaluates_to_null` support query optimizer rules.
+* `datafusion/sql/src/utils.rs`
+
+  * Helpers like `resolve_columns`, `rebase_expr`, and `check_columns_satisfy_exprs` aid SQL planning and validation.
+* `datafusion/common-runtime/src/trace_utils.rs`
+
+  * `set_join_set_tracer`, `trace_future`, and `trace_block` inject consistent instrumentation for asynchronous and blocking workloads.
+* `datafusion/common-runtime/src/join_set.rs` and `datafusion/common-runtime/src/common.rs`
+
+  * `JoinSet` and `SpawnedTask` wrap Tokio primitives with automatic tracing and cancellation to simplify task management.
+* `datafusion/physical-plan/src/metrics`
+
+  * `ExecutionPlanMetricsSet`, `MetricBuilder`, and `BaselineMetrics` streamline exposing counters, timers, and spill statistics from execution operators.
+* `datafusion/physical-expr-adapter/src/schema_rewriter.rs`
+
+  * `PhysicalExprAdapter` and `DefaultPhysicalExprAdapterFactory` rewrite physical expressions to match differing logical and physical schemas, handling casts, missing columns, and partition values.
+
+## Commenting guidance
+
+Use three complementary kinds of comments in the codebase to keep intent clear and the public API documented:
+
+- Implementation Comments
+  - Explains non-obvious choices and tricky implementations.
+  - Serves as breadcrumbs for future developers when reasoning about why code is written in a particular way.
+
+- Documentation Comments
+  - Describes functions, types, traits, modules and their public behaviour and contracts.
+  - Acts as the public interface documentation (prefer `///` Rust doc comments for public Rust items).
+
+- Contextual Comments
+  - Documents assumptions, preconditions, invariants, and non-obvious requirements.
+  - Use these to record constraints that aren't enforced directly in code (e.g., expected input ranges, thread-safety considerations, or compatibility notes).
+
+Keep comments short, factual, and up-to-date. Prefer code clarity and small helper functions over long explanatory blocks. When a comment becomes longer than a paragraph, prefer extracting intent into a well-named function or adding a `TODO` with a short plan.
diff --git a/datafusion/optimizer/src/simplify_expressions/expr_simplifier.rs b/datafusion/optimizer/src/simplify_expressions/expr_simplifier.rs
index c6644e008645a..5cd286f63b132 100644
--- a/datafusion/optimizer/src/simplify_expressions/expr_simplifier.rs
+++ b/datafusion/optimizer/src/simplify_expressions/expr_simplifier.rs
@@ -2312,7 +2312,7 @@ fn simplify_right_is_one_case(
         Err(_) => Ok(Transformed::yes(*left)),
     }
 }
-
+/// trigger ci extended tests
 #[cfg(test)]
 mod tests {
     use super::*;
diff --git a/datafusion/sqllogictest/bin/sqllogictests.rs b/datafusion/sqllogictest/bin/sqllogictests.rs
index 3571377354eb4..463b7b03a760c 100644
--- a/datafusion/sqllogictest/bin/sqllogictests.rs
+++ b/datafusion/sqllogictest/bin/sqllogictests.rs
@@ -44,9 +44,11 @@ use datafusion::common::runtime::SpawnedTask;
 use futures::FutureExt;
 use std::ffi::OsStr;
 use std::fs;
-use std::io::{IsTerminal, stdout};
+use std::io::{IsTerminal, stderr, stdout};
 use std::path::{Path, PathBuf};
 use std::str::FromStr;
+use std::sync::Arc;
+use std::sync::atomic::{AtomicUsize, Ordering};
 
 #[cfg(feature = "postgres")]
 mod postgres_container;
@@ -110,6 +112,13 @@ async fn run_tests() -> Result<()> {
 
     options.warn_on_ignored();
 
+    // Print parallelism info for debugging CI performance
+    eprintln!(
+        "Running with {} test threads (available parallelism: {})",
+        options.test_threads,
+        get_available_parallelism()
+    );
+
     #[cfg(feature = "postgres")]
     initialize_postgres_container(&options).await?;
 
@@ -147,6 +156,10 @@ async fn run_tests() -> Result<()> {
     }
 
     let num_tests = test_files.len();
+    // For CI environments without TTY, print progress periodically
+    let is_ci = !stderr().is_terminal();
+    let completed_count = Arc::new(AtomicUsize::new(0));
+
     let errors: Vec<_> = futures::stream::iter(test_files)
         .map(|test_file| {
             let validator = if options.include_sqlite
@@ -162,10 +175,12 @@ async fn run_tests() -> Result<()> {
             let filters = options.filters.clone();
 
             let relative_path = test_file.relative_path.clone();
+            let relative_path_for_timing = test_file.relative_path.clone();
 
             let currently_running_sql_tracker = CurrentlyExecutingSqlTracker::new();
             let currently_running_sql_tracker_clone =
                 currently_running_sql_tracker.clone();
+            let file_start = Instant::now();
             SpawnedTask::spawn(async move {
                 match (
                     options.postgres_runner,
@@ -227,14 +242,38 @@ async fn run_tests() -> Result<()> {
                         )
                         .await?
                     }
+                };
+                // Log slow files (>30s) for CI debugging
+                let elapsed = file_start.elapsed();
+                if elapsed.as_secs() > 30 {
+                    eprintln!(
+                        "Slow file: {} took {:.1}s",
+                        relative_path_for_timing.display(),
+                        elapsed.as_secs_f64()
+                    );
                 }
-                Ok(()) as Result<()>
+                Ok(())
             })
             .join()
             .map(move |result| (result, relative_path, currently_running_sql_tracker))
         })
         // run up to num_cpus streams in parallel
         .buffer_unordered(options.test_threads)
+        .inspect({
+            let completed_count = Arc::clone(&completed_count);
+            move |_| {
+                let completed = completed_count.fetch_add(1, Ordering::Relaxed) + 1;
+                // In CI (no TTY), print progress every 10% or every 50 files
+                if is_ci && (completed.is_multiple_of(50) || completed == num_tests) {
+                    eprintln!(
+                        "Progress: {}/{} files completed ({:.0}%)",
+                        completed,
+                        num_tests,
+                        (completed as f64 / num_tests as f64) * 100.0
+                    );
+                }
+            }
+        })
         .flat_map(|(result, test_file_path, current_sql)| {
             // Filter out any Ok() leaving only the DataFusionErrors
             futures::stream::iter(match result {