lance-format · yanghua · Jul 16, 2025 · Jun 25, 2025 · Jun 25, 2025 · Jun 25, 2025
diff --git a/rust/lance/src/dataset.rs b/rust/lance/src/dataset.rs
@@ -60,6 +60,7 @@ pub mod refs;
 pub(crate) mod rowids;
 pub mod scanner;
 mod schema_evolution;
+pub mod sql;
 pub mod statistics;
 mod take;
 pub mod transaction;
@@ -74,6 +75,7 @@ use self::refs::Tags;
 use self::scanner::{DatasetRecordBatchStream, Scanner};
 use self::transaction::{Operation, Transaction};
 use self::write::write_fragments_internal;
+use crate::dataset::sql::SqlQueryBuilder;
 use crate::datatypes::Schema;
 use crate::error::box_error;
 use crate::io::commit::{
@@ -1449,6 +1451,13 @@ impl Dataset {
         *self = self.checkout_version(latest_version).await?;
         Ok(())
     }
+
+    /// Run a SQL query against the dataset.
+    /// The underlying SQL engine is DataFusion.
+    /// Please refer to the DataFusion documentation for supported SQL syntax.
+    pub fn sql(&mut self, sql: &str) -> SqlQueryBuilder {
+        SqlQueryBuilder::new(self.clone(), sql)
+    }
 }
 
 pub(crate) struct NewTransactionResult<'a> {

diff --git a/rust/lance/src/dataset/sql.rs b/rust/lance/src/dataset/sql.rs
@@ -0,0 +1,214 @@
+// SPDX-License-Identifier: Apache-2.0
+// SPDX-FileCopyrightText: Copyright The Lance Authors
+
+use crate::datafusion::LanceTableProvider;
+use crate::Dataset;
+use arrow_array::{Array, RecordBatch, StringArray};
+use datafusion::dataframe::DataFrame;
+use datafusion::execution::SendableRecordBatchStream;
+use datafusion::prelude::SessionContext;
+use std::sync::Arc;
+
+/// A SQL builder to prepare options for running SQL queries against a Lance dataset.
+#[derive(Clone, Debug)]
+pub struct SqlQueryBuilder {
+    /// The dataset to run the SQL query
+    pub(crate) dataset: Dataset,
+
+    /// The SQL query to run
+    pub(crate) sql: String,
+
+    /// the name of the table to register in the datafusion context
+    pub(crate) table_name: String,
+
+    /// If true, the query result will include the internal row id
+    pub(crate) with_row_id: bool,
+
+    /// If true, the query result will include the internal row address
+    pub(crate) with_row_addr: bool,
+}
+
+impl SqlQueryBuilder {
+    pub fn new(dataset: Dataset, sql: &str) -> Self {
+        Self {
+            dataset,
+            sql: sql.to_string(),
+            table_name: "dataset".to_string(),
+            with_row_id: false,
+            with_row_addr: false,
+        }
+    }
+
+    /// The table name to register in the datafusion context.
+    /// This is used to specify a "table name" for the dataset.
+    /// So that you can run SQL queries against it.
+    /// If not set, the default table name is "dataset".
+    pub fn table_name(mut self, table_name: &str) -> Self {
+        self.table_name = table_name.to_string();
+        self
+    }
+
+    /// Specify if the query result should include the internal row id.
+    /// If true, the query result will include an additional column named "_rowid".
+    pub fn with_row_id(mut self, row_id: bool) -> Self {
+        self.with_row_id = row_id;
+        self
+    }
+
+    /// Specify if the query result should include the internal row address.
+    /// If true, the query result will include an additional column named "_rowaddr".
+    pub fn with_row_addr(mut self, row_addr: bool) -> Self {
+        self.with_row_addr = row_addr;
+        self
+    }
+
+    pub async fn build(self) -> lance_core::Result<SqlQuery> {
+        let ctx = SessionContext::new();
+        let row_id = self.with_row_id;
+        let row_addr = self.with_row_addr;
+        ctx.register_table(
+            self.table_name,
+            Arc::new(LanceTableProvider::new(
+                Arc::new(self.dataset.clone()),
+                row_id,
+                row_addr,
+            )),
+        )?;
+        let df = ctx.sql(&self.sql).await?;
+        Ok(SqlQuery::new(df))
+    }
+}
+
+pub struct SqlQuery {
+    dataframe: DataFrame,
+}
+
+impl SqlQuery {
+    pub fn new(dataframe: DataFrame) -> Self {
+        Self { dataframe }
+    }
+
+    pub async fn into_stream(self) -> SendableRecordBatchStream {
+        self.dataframe.execute_stream().await.unwrap()
+    }
+
+    pub async fn into_batch_records(self) -> lance_core::Result<Vec<RecordBatch>> {
+        use futures::TryStreamExt;
+        Ok(self
+            .dataframe
+            .execute_stream()
+            .await
+            .unwrap()
+            .try_collect::<Vec<_>>()
+            .await?)
+    }
+
+    pub fn into_dataframe(self) -> DataFrame {
+        self.dataframe
+    }
+
+    pub async fn into_explain_plan(
+        self,
+        verbose: bool,
+        analyze: bool,
+    ) -> lance_core::Result<String> {
+        let explained_df = self.dataframe.explain(verbose, analyze)?;
+        let batches = explained_df.collect().await?;
+        let mut lines = Vec::new();
+        for batch in &batches {
+            let column = batch.column(0);
+            let array = column
+                .as_any()
+                .downcast_ref::<StringArray>()
+                .expect("Expected StringArray in 'plan' column for DataFrame.explain");
+            for i in 0..array.len() {
+                lines.push(array.value(i).to_string());
+            }
+        }
+
+        Ok(lines.join("\n"))
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use crate::utils::test::{DatagenExt, FragmentCount, FragmentRowCount};
+    use all_asserts::assert_true;
+    use arrow_array::cast::AsArray;
+    use arrow_array::types::{Int32Type, Int64Type, UInt64Type};
+    use lance_datagen::{array, gen};
+
+    #[tokio::test]
+    async fn test_sql_execute() {
+        let mut ds = gen()
+            .col("x", array::step::<Int32Type>())
+            .col("y", array::step_custom::<Int32Type>(0, 2))
+            .into_dataset(
+                "memory://test_sql_dataset",
+                FragmentCount::from(10),
+                FragmentRowCount::from(10),
+            )
+            .await
+            .unwrap();
+
+        let results = ds
+            .sql("SELECT SUM(x) FROM foo WHERE y > 100")
+            .table_name("foo")
+            .build()
+            .await
+            .unwrap()
+            .into_batch_records()
+            .await
+            .unwrap();
+        pretty_assertions::assert_eq!(results.len(), 1);
+        let results = results.into_iter().next().unwrap();
+        pretty_assertions::assert_eq!(results.num_columns(), 1);
+        pretty_assertions::assert_eq!(results.num_rows(), 1);
+        // SUM(0..100) - SUM(0..50) = 3675
+        pretty_assertions::assert_eq!(results.column(0).as_primitive::<Int64Type>().value(0), 3675);
+
+        let results = ds
+            .sql("SELECT x, y, _rowid, _rowaddr FROM foo where y > 100")
+            .table_name("foo")
+            .with_row_id(true)
+            .with_row_addr(true)
+            .build()
+            .await
+            .unwrap()
+            .into_batch_records()
+            .await
+            .unwrap();
+        let total_rows: usize = results.iter().map(|batch| batch.num_rows()).sum();
+        let expect_rows = ds.count_rows(Some("y > 100".to_string())).await.unwrap();
+        pretty_assertions::assert_eq!(total_rows, expect_rows);
+        let results = results.into_iter().next().unwrap();
+        pretty_assertions::assert_eq!(results.num_columns(), 4);
+        assert_true!(results.column(2).as_primitive::<UInt64Type>().value(0) > 100);
+        assert_true!(results.column(3).as_primitive::<UInt64Type>().value(0) > 100);
+    }
+
+    #[tokio::test]
+    async fn test_sql_explain_plan() {
+        let mut ds = gen()
+            .col("x", array::step::<Int32Type>())
+            .col("y", array::step_custom::<Int32Type>(0, 2))
+            .into_dataset(
+                "memory://test_sql_explain_plan",
+                FragmentCount::from(2),
+                FragmentRowCount::from(5),
+            )
+            .await
+            .unwrap();
+
+        let builder = ds
+            .sql("SELECT SUM(x) FROM foo WHERE y > 2")
+            .table_name("foo")
+            .build()
+            .await
+            .unwrap();
+
+        let plan = builder.into_explain_plan(true, false).await.unwrap();
+
+        assert!(plan.contains("Aggregate") || plan.contains("SUM"));
+    }
+}