From e78cf7f814f8e0df16f7197b6921d225af187231 Mon Sep 17 00:00:00 2001
From: Fangyin Cheng
Date: Fri, 7 Nov 2025 16:05:56 +0800
Subject: [PATCH] fix(doc): fix batch udf with checkpoint document error

---
 docs/src/guide/data_evolution.md | 5 ++++-
 1 file changed, 4 insertions(+), 1 deletion(-)

diff --git a/docs/src/guide/data_evolution.md b/docs/src/guide/data_evolution.md
index 57c739f2462..d6c7b23f674 100644
--- a/docs/src/guide/data_evolution.md
+++ b/docs/src/guide/data_evolution.md
@@ -95,7 +95,10 @@ dataset = lance.write_dataset(table, "ids")
 @lance.batch_udf(checkpoint_file="embedding_checkpoint.sqlite")
 def add_random_vector(batch):
     embeddings = np.random.rand(batch.num_rows, 128).astype("float32")
-    return pd.DataFrame({"embedding": embeddings})
+    return pa.RecordBatch.from_arrays(
+        [pa.FixedSizeListArray.from_arrays(embeddings.flatten(), 128)],
+        names=["embedding"]
+    )
 
 dataset.add_columns(add_random_vector)
 ```